From 817ead3aed90bad8c6bd38063ec8bdfcacb4ff5f Mon Sep 17 00:00:00 2001 From: crusaderky Date: Tue, 30 Aug 2022 17:11:35 +0100 Subject: [PATCH] Document Scheduler and Worker state machine (#6948) --- distributed/worker_state_machine.py | 39 +- docs/source/images/run_dot.sh | 9 + docs/source/images/task-state.dot | 7 +- docs/source/images/task-state.svg | 150 +++--- docs/source/images/worker-cancel-state1.dot | 21 + docs/source/images/worker-cancel-state1.svg | 109 +++++ docs/source/images/worker-cancel-state2.dot | 21 + docs/source/images/worker-cancel-state2.svg | 109 +++++ docs/source/images/worker-dep-state.dot | 5 +- docs/source/images/worker-dep-state.svg | 75 +-- ...ask-state.dot => worker-execute-state.dot} | 6 +- docs/source/images/worker-execute-state.svg | 138 ++++++ docs/source/images/worker-forget-state.dot | 15 + docs/source/images/worker-forget-state.svg | 79 +++ docs/source/images/worker-scatter-state.dot | 7 + docs/source/images/worker-scatter-state.svg | 30 ++ docs/source/images/worker-state-machine.dot | 55 +++ docs/source/images/worker-state-machine.svg | 127 +++++ docs/source/images/worker-task-state.svg | 103 ---- docs/source/index.rst | 1 + docs/source/scheduling-state.rst | 159 ++++-- docs/source/worker-state.rst | 459 ++++++++++++++++++ docs/source/worker.rst | 75 +-- 23 files changed, 1446 insertions(+), 353 deletions(-) create mode 100755 docs/source/images/run_dot.sh create mode 100644 docs/source/images/worker-cancel-state1.dot create mode 100644 docs/source/images/worker-cancel-state1.svg create mode 100644 docs/source/images/worker-cancel-state2.dot create mode 100644 docs/source/images/worker-cancel-state2.svg rename docs/source/images/{worker-task-state.dot => worker-execute-state.dot} (64%) create mode 100644 docs/source/images/worker-execute-state.svg create mode 100644 docs/source/images/worker-forget-state.dot create mode 100644 docs/source/images/worker-forget-state.svg create mode 100644 docs/source/images/worker-scatter-state.dot create mode 100644 docs/source/images/worker-scatter-state.svg create mode 100644 docs/source/images/worker-state-machine.dot create mode 100644 docs/source/images/worker-state-machine.svg delete mode 100644 docs/source/images/worker-task-state.svg create mode 100644 docs/source/worker-state.rst diff --git a/distributed/worker_state_machine.py b/distributed/worker_state_machine.py index 88d2e93692..431c8d9a8c 100644 --- a/distributed/worker_state_machine.py +++ b/distributed/worker_state_machine.py @@ -238,9 +238,10 @@ class TaskState: #: The current state of the task state: TaskStateState = "released" - #: The previous state of the task. It is not None iff state in (cancelled, resumed). + #: The previous state of the task. It is not None iff :attr:`state` in + #: (cancelled, resumed). previous: Literal["executing", "long-running", "flight", None] = None - #: The next state of the task. It is not None iff state == resumed. + #: The next state of the task. It is not None iff :attr:`state` == resumed. next: Literal["fetch", "waiting", None] = None #: Expected duration of the task @@ -278,7 +279,9 @@ class TaskState: nbytes: int | None = None #: Arbitrary task annotations annotations: dict | None = None - #: True if the task is in memory or erred; False otherwise + #: True if the :meth:`~WorkerBase.execute` or :meth:`~WorkerBase.gather_dep` + #: coroutine servicing this task completed; False otherwise. This flag changes + #: the behaviour of transitions out of the ``executing``, ``flight`` etc. states. 
done: bool = False _instances: ClassVar[weakref.WeakSet[TaskState]] = weakref.WeakSet() @@ -563,7 +566,10 @@ class StealResponseMsg(SendMessageToScheduler): @dataclass class StateMachineEvent: + """Base abstract class for all stimuli that can modify the worker state""" + __slots__ = ("stimulus_id", "handled") + #: Unique ID of the event stimulus_id: str #: timestamp of when the event was handled by the worker # TODO Switch to @dataclass(slots=True), uncomment the line below, and remove the @@ -572,6 +578,7 @@ class StateMachineEvent: _classes: ClassVar[dict[str, type[StateMachineEvent]]] = {} def __new__(cls, *args: Any, **kwargs: Any) -> StateMachineEvent: + """Hack to initialize the ``handled`` attribute in Python <3.10""" self = object.__new__(cls) self.handled = None return self @@ -1127,11 +1134,11 @@ class WorkerState: #: All and only tasks with ``TaskState.state == 'missing'``. missing_dep_flight: set[TaskState] - #: Which tasks that are coming to us in current peer-to-peer connections. - #: This set includes exclusively: - #: - tasks with :attr:`state` == 'flight' - #: - tasks with :attr:`state` in ('cancelled', 'resumed') and - #: :attr:`previous` == 'flight` + #: Tasks that are coming to us in current peer-to-peer connections. + #: + #: This set includes exclusively tasks with :attr:`~TaskState.state` == 'flight' as + #: well as tasks with :attr:`~TaskState.state` in ('cancelled', 'resumed') and + #: :attr:`~TaskState.previous` == 'flight`. #: #: See also :meth:`in_flight_tasks_count`. in_flight_tasks: set[TaskState] @@ -1176,10 +1183,10 @@ class WorkerState: available_resources: dict[str, float] #: Set of tasks that are currently running. - #: This set includes exclusively: - #: - tasks with :attr:`state` == 'executing' - #: - tasks with :attr:`state` in ('cancelled', 'resumed') and - #: :attr:`previous` == 'executing` + #: + #: This set includes exclusively tasks with :attr:`~TaskState.state` == 'executing' + #: as well as tasks with :attr:`~TaskState.state` in ('cancelled', 'resumed') and + #: :attr:`~TaskState.previous` == 'executing`. #: #: See also :meth:`executing_count` and :attr:`long_running`. executing: set[TaskState] @@ -1188,11 +1195,11 @@ class WorkerState: #: :func:`~distributed.secede`, so they no longer count towards the maximum number #: of concurrent tasks (nthreads). #: These tasks do not appear in the :attr:`executing` set. - #: This set includes exclusively: - #: - tasks with :attr:`state` == 'long-running' - #: - tasks with :attr:`state` in ('cancelled', 'resumed') and - #: :attr:`previous` == 'long-running` #: + #: This set includes exclusively tasks with + #: :attr:`~TaskState.state` == 'long-running' as well as tasks with + #: :attr:`~TaskState.state` in ('cancelled', 'resumed') and + #: :attr:`~TaskState.previous` == 'long-running`. 
long_running: set[TaskState] #: A number of tasks that this worker has run in its lifetime; this includes failed diff --git a/docs/source/images/run_dot.sh b/docs/source/images/run_dot.sh new file mode 100755 index 0000000000..9caf0c338f --- /dev/null +++ b/docs/source/images/run_dot.sh @@ -0,0 +1,9 @@ +#!/usr/bin/env bash + +set -o errexit + +for in_fname in *.dot +do + out_fname=${in_fname%.dot}.svg + dot -Tsvg $in_fname > $out_fname +done diff --git a/docs/source/images/task-state.dot b/docs/source/images/task-state.dot index 52ec18ff57..fde7d8c62c 100644 --- a/docs/source/images/task-state.dot +++ b/docs/source/images/task-state.dot @@ -5,15 +5,12 @@ digraph{ ]; released1 [label=released]; released2 [label=released]; - new -> released1; released1 -> waiting; waiting -> processing; - waiting -> "no-worker"; - "no-worker" -> waiting; - "no-worker" -> processing; + waiting -> "no-worker" [dir=both]; processing -> memory; processing -> error; - error -> forgotten; + error -> released2; memory -> released2; released2 -> forgotten; } diff --git a/docs/source/images/task-state.svg b/docs/source/images/task-state.svg index 49e6e81c98..7b7d5c84ad 100644 --- a/docs/source/images/task-state.svg +++ b/docs/source/images/task-state.svg @@ -1,113 +1,109 @@ - - - - -%3 - + + + + -released1 - -released + +released1 + +released -waiting - -waiting + +waiting + +waiting -released1->waiting - - + +released1->waiting + + -released2 - -released + +released2 + +released -forgotten - -forgotten + +forgotten + +forgotten -released2->forgotten - - - - -new - -new - - -new->released1 - - + +released2->forgotten + + -processing - -processing + +processing + +processing -waiting->processing - - + +waiting->processing + + -no-worker - -no-worker + +no-worker + +no-worker -waiting->no-worker - - + +waiting->no-worker + + + -memory - -memory + +memory + +memory -processing->memory - - + +processing->memory + + -error - -error + +error + +error -processing->error - - - - -no-worker->waiting - - - - -no-worker->processing - - + +processing->error + + -memory->released2 - - - - -error->forgotten - - + +memory->released2 + + + + + +error->released2 + + diff --git a/docs/source/images/worker-cancel-state1.dot b/docs/source/images/worker-cancel-state1.dot new file mode 100644 index 0000000000..72dc1fb881 --- /dev/null +++ b/docs/source/images/worker-cancel-state1.dot @@ -0,0 +1,21 @@ +digraph{ + graph [ + bgcolor="#FFFFFFF00", + rankdir=LR, + ]; + + executing1 [label="executing"]; + executing2 [label="executing"]; + cancelled [label="cancelled(executing)"]; + resumed [label="resumed(fetch)"]; + + executing1 -> cancelled; + cancelled -> released; + cancelled -> executing2; + released -> forgotten; + + cancelled -> resumed [dir=both]; + resumed -> executing2; + resumed -> memory; + resumed -> fetch; +} diff --git a/docs/source/images/worker-cancel-state1.svg b/docs/source/images/worker-cancel-state1.svg new file mode 100644 index 0000000000..243cccc2c5 --- /dev/null +++ b/docs/source/images/worker-cancel-state1.svg @@ -0,0 +1,109 @@ + + + + + + + + + +executing1 + +executing + + + +cancelled + +cancelled(executing) + + + +executing1->cancelled + + + + + +executing2 + +executing + + + +cancelled->executing2 + + + + + +resumed + +resumed(fetch) + + + +cancelled->resumed + + + + + + +released + +released + + + +cancelled->released + + + + + +resumed->executing2 + + + + + +memory + +memory + + + +resumed->memory + + + + + +fetch + +fetch + + + +resumed->fetch + + + + + +forgotten + +forgotten + + + +released->forgotten + + + + 
+ diff --git a/docs/source/images/worker-cancel-state2.dot b/docs/source/images/worker-cancel-state2.dot new file mode 100644 index 0000000000..e5bdcfcad2 --- /dev/null +++ b/docs/source/images/worker-cancel-state2.dot @@ -0,0 +1,21 @@ +digraph{ + graph [ + bgcolor="#FFFFFFF00", + rankdir=LR, + ]; + + flight1 [label=flight]; + flight2 [label=flight]; + cancelled [label="cancelled(flight)"]; + resumed [label="resumed(waiting)"]; + + flight1 -> cancelled; + cancelled -> flight2; + cancelled -> released; + released -> forgotten; + + cancelled -> resumed [dir=both]; + resumed -> flight2; + resumed -> memory; + resumed -> waiting; +} diff --git a/docs/source/images/worker-cancel-state2.svg b/docs/source/images/worker-cancel-state2.svg new file mode 100644 index 0000000000..31c391f5a2 --- /dev/null +++ b/docs/source/images/worker-cancel-state2.svg @@ -0,0 +1,109 @@ + + + + + + + + + +flight1 + +flight + + + +cancelled + +cancelled(flight) + + + +flight1->cancelled + + + + + +flight2 + +flight + + + +cancelled->flight2 + + + + + +resumed + +resumed(waiting) + + + +cancelled->resumed + + + + + + +released + +released + + + +cancelled->released + + + + + +resumed->flight2 + + + + + +memory + +memory + + + +resumed->memory + + + + + +waiting + +waiting + + + +resumed->waiting + + + + + +forgotten + +forgotten + + + +released->forgotten + + + + + diff --git a/docs/source/images/worker-dep-state.dot b/docs/source/images/worker-dep-state.dot index 18a5e40cfa..44ba3a7266 100644 --- a/docs/source/images/worker-dep-state.dot +++ b/docs/source/images/worker-dep-state.dot @@ -3,8 +3,11 @@ digraph{ bgcolor="#FFFFFFF00", rankdir=LR, ]; - new -> fetch; + + released -> fetch; fetch -> flight; flight -> fetch; + fetch -> missing; + missing -> fetch; flight -> memory; } diff --git a/docs/source/images/worker-dep-state.svg b/docs/source/images/worker-dep-state.svg index 9b7b04e8d9..76e83eb4c9 100644 --- a/docs/source/images/worker-dep-state.svg +++ b/docs/source/images/worker-dep-state.svg @@ -1,61 +1,78 @@ - - - - -%3 - - + + + + + -new - -new +released + +released fetch - -fetch + +fetch - + -new->fetch - - +released->fetch + + flight - -flight + +flight fetch->flight - - + + + + + +missing + +missing + + + +fetch->missing + + flight->fetch - - + + - + memory - -memory + +memory - + flight->memory - - + + + + + +missing->fetch + + diff --git a/docs/source/images/worker-task-state.dot b/docs/source/images/worker-execute-state.dot similarity index 64% rename from docs/source/images/worker-task-state.dot rename to docs/source/images/worker-execute-state.dot index 4a6fc8cbac..769993c30d 100644 --- a/docs/source/images/worker-task-state.dot +++ b/docs/source/images/worker-execute-state.dot @@ -3,12 +3,16 @@ digraph{ bgcolor="#FFFFFFF00", rankdir=LR, ]; - new -> waiting; + released -> waiting; waiting -> ready; + waiting -> constrained; ready -> executing; + constrained -> executing; executing -> "long-running"; executing -> memory; executing -> error; + executing -> rescheduled; "long-running" -> memory; "long-running" -> error; + "long-running" -> rescheduled; } diff --git a/docs/source/images/worker-execute-state.svg b/docs/source/images/worker-execute-state.svg new file mode 100644 index 0000000000..f12b58f65d --- /dev/null +++ b/docs/source/images/worker-execute-state.svg @@ -0,0 +1,138 @@ + + + + + + + + + +released + +released + + + +waiting + +waiting + + + +released->waiting + + + + + +ready + +ready + + + +waiting->ready + + + + + +constrained + +constrained + + + +waiting->constrained + + + + + +executing + 
+executing + + + +ready->executing + + + + + +constrained->executing + + + + + +long-running + +long-running + + + +executing->long-running + + + + + +memory + +memory + + + +executing->memory + + + + + +error + +error + + + +executing->error + + + + + +rescheduled + +rescheduled + + + +executing->rescheduled + + + + + +long-running->memory + + + + + +long-running->error + + + + + +long-running->rescheduled + + + + + diff --git a/docs/source/images/worker-forget-state.dot b/docs/source/images/worker-forget-state.dot new file mode 100644 index 0000000000..8eee411fa3 --- /dev/null +++ b/docs/source/images/worker-forget-state.dot @@ -0,0 +1,15 @@ +digraph{ + graph [ + bgcolor="#FFFFFFF00", + rankdir=LR, + ]; + free_keys [ + label="Wait for free-keys\nfrom the scheduler", + shape=box,style=dashed, + ]; + memory -> free_keys; + error -> free_keys; + free_keys -> released; + rescheduled -> released; + released -> forgotten; +} diff --git a/docs/source/images/worker-forget-state.svg b/docs/source/images/worker-forget-state.svg new file mode 100644 index 0000000000..64cf54891e --- /dev/null +++ b/docs/source/images/worker-forget-state.svg @@ -0,0 +1,79 @@ + + + + + + + + + +free_keys + +Wait for free-keys +from the scheduler + + + +released + +released + + + +free_keys->released + + + + + +memory + +memory + + + +memory->free_keys + + + + + +error + +error + + + +error->free_keys + + + + + +forgotten + +forgotten + + + +released->forgotten + + + + + +rescheduled + +rescheduled + + + +rescheduled->released + + + + + diff --git a/docs/source/images/worker-scatter-state.dot b/docs/source/images/worker-scatter-state.dot new file mode 100644 index 0000000000..cc36ce3d71 --- /dev/null +++ b/docs/source/images/worker-scatter-state.dot @@ -0,0 +1,7 @@ +digraph{ + graph [ + bgcolor="#FFFFFFF00", + rankdir=LR, + ]; + released -> memory; +} diff --git a/docs/source/images/worker-scatter-state.svg b/docs/source/images/worker-scatter-state.svg new file mode 100644 index 0000000000..ee0654021e --- /dev/null +++ b/docs/source/images/worker-scatter-state.svg @@ -0,0 +1,30 @@ + + + + + + + + + +released + +released + + + +memory + +memory + + + +released->memory + + + + + diff --git a/docs/source/images/worker-state-machine.dot b/docs/source/images/worker-state-machine.dot new file mode 100644 index 0000000000..a3cd798ac8 --- /dev/null +++ b/docs/source/images/worker-state-machine.dot @@ -0,0 +1,55 @@ +digraph { + graph [ + bgcolor="#FFFFFFF00", + rankdir=TB, + ]; + + Scheduler [ + shape=rect, + fontsize = 20, + ]; + + stimuli [ + label="StateMachineEvent", + shape=rect, + style=filled, + color=grey, + ]; + + instructions [ + label="list[Instruction]", + shape=rect, + style=filled, + color=grey, + ]; + + subgraph cluster_0 { + label = "Worker"; + fontsize = 20; + + Worker_handle_stimulus [label="handle_stimulus()"]; + Worker_execute [label="execute()\ngather_dep()\nbatched_send()"]; + } + + subgraph cluster_1 { + label = "BaseWorker"; + fontsize = 20; + + BaseWorker_handle_stimulus [label="handle_stimulus()"]; + BaseWorker_execute [label="execute()\ngather_dep()\nbatched_send()"]; + } + + subgraph cluster_2 { + label = "WorkerState"; + fontsize = 20; + + WorkerState_handle_stimulus [label="handle_stimulus()"]; + } + + Scheduler -> stimuli; + stimuli -> Worker_handle_stimulus; + Worker_handle_stimulus -> BaseWorker_handle_stimulus; + BaseWorker_handle_stimulus -> WorkerState_handle_stimulus; + # trick to have arrows going from the bottom to the top of the graph + stimuli -> Worker_execute -> BaseWorker_execute -> 
instructions -> WorkerState_handle_stimulus [dir=back]; +} diff --git a/docs/source/images/worker-state-machine.svg b/docs/source/images/worker-state-machine.svg new file mode 100644 index 0000000000..ef0e4bf476 --- /dev/null +++ b/docs/source/images/worker-state-machine.svg @@ -0,0 +1,127 @@ + + + + + + + + +cluster_0 + +Worker + + +cluster_1 + +BaseWorker + + +cluster_2 + +WorkerState + + + +Scheduler + +Scheduler + + + +stimuli + +StateMachineEvent + + + +Scheduler->stimuli + + + + + +Worker_handle_stimulus + +handle_stimulus() + + + +stimuli->Worker_handle_stimulus + + + + + +Worker_execute + +execute() +gather_dep() +batched_send() + + + +stimuli->Worker_execute + + + + + +instructions + +list[Instruction] + + + +WorkerState_handle_stimulus + +handle_stimulus() + + + +instructions->WorkerState_handle_stimulus + + + + + +BaseWorker_handle_stimulus + +handle_stimulus() + + + +Worker_handle_stimulus->BaseWorker_handle_stimulus + + + + + +BaseWorker_execute + +execute() +gather_dep() +batched_send() + + + +Worker_execute->BaseWorker_execute + + + + + +BaseWorker_handle_stimulus->WorkerState_handle_stimulus + + + + + +BaseWorker_execute->instructions + + + + + diff --git a/docs/source/images/worker-task-state.svg b/docs/source/images/worker-task-state.svg deleted file mode 100644 index edc4b83404..0000000000 --- a/docs/source/images/worker-task-state.svg +++ /dev/null @@ -1,103 +0,0 @@ - - - - - - -%3 - - - -new - -new - - - -waiting - -waiting - - - -new->waiting - - - - - -ready - -ready - - - -waiting->ready - - - - - -executing - -executing - - - -ready->executing - - - - - -long-running - -long-running - - - -executing->long-running - - - - - -memory - -memory - - - -executing->memory - - - - - -error - -error - - - -executing->error - - - - - -long-running->memory - - - - - -long-running->error - - - - - diff --git a/docs/source/index.rst b/docs/source/index.rst index 6ae9744395..2c76cb5f68 100644 --- a/docs/source/index.rst +++ b/docs/source/index.rst @@ -100,6 +100,7 @@ Contents scheduling-policies scheduling-state worker + worker-state worker-memory work-stealing killed diff --git a/docs/source/scheduling-state.rst b/docs/source/scheduling-state.rst index 3e8dfb4e81..9354b8f6b7 100644 --- a/docs/source/scheduling-state.rst +++ b/docs/source/scheduling-state.rst @@ -1,5 +1,5 @@ -Scheduling State -================ +Scheduler State Machine +======================= .. currentmodule:: distributed.scheduler @@ -60,33 +60,42 @@ Tasks flow along the following states with the following allowed transitions: .. image:: images/task-state.svg :alt: Dask scheduler task states -* *Released*: Known but not actively computing or in memory -* *Waiting*: On track to be computed, waiting on dependencies to arrive in - memory -* *No-worker*: Ready to be computed, but no appropriate worker exists - (for example because of resource restrictions, or because no worker is - connected at all). -* *Processing*: All dependencies are available and the task is assigned to a - worker for compute (the scheduler doesn't know whether it's in a worker - queue or actively being computed). 
-* *Memory*: In memory on one or more workers
-* *Erred*: Task computation, or one of its dependencies, has encountered an error
-* *Forgotten* (not actually a state): Task is no longer needed by any client
-  or dependent task
+released
+    Known but not actively computing or in memory
+waiting
+    On track to be computed, waiting on dependencies to arrive in memory
+no-worker
+    Ready to be computed, but no appropriate worker exists (for example because of
+    resource restrictions, or because no worker is connected at all).
+processing
+    All dependencies are available and the task is assigned to a worker for compute (the
+    scheduler doesn't know whether it's in a worker queue or actively being computed).
+memory
+    In memory on one or more workers
+erred
+    Task computation, or one of its dependencies, has encountered an error
+forgotten
+    Task is no longer needed by any client or dependent task, so it disappears from the
+    scheduler as well. As soon as a task reaches this state, it is immediately
+    dereferenced from the scheduler.
+
+.. note::
+    There's no intermediate state between ``waiting`` / ``no-worker`` and
+    ``processing``: as soon as a task has all of its dependencies in memory somewhere on
+    the cluster, it is immediately assigned to a worker. This can lead to very long task
+    queues on the workers, which are then rebalanced dynamically through
+    :doc:`work-stealing`.

 In addition to the literal state, though, other information needs to be
 kept and updated about each task. Individual task state is stored in an
-object named :class:`TaskState` and consists of the following information:
-
-.. autoclass:: TaskState
-   :members:
+object named :class:`TaskState`; see full API through the link.

 The scheduler keeps track of all the :class:`TaskState` objects (those
 not in the "forgotten" state) using several containers:

 .. attribute:: tasks: {str: TaskState}

-   A dictionary mapping task keys (usually strings) to :class:`TaskState`
+   A dictionary mapping task keys (always strings) to :class:`TaskState`
    objects. Task keys are how information about tasks is communicated
    between the scheduler and clients, or the scheduler and workers; this
    dictionary is then used to find the corresponding :class:`TaskState`
@@ -99,17 +108,23 @@ not in the "forgotten" state) using several containers:
    (their :attr:`~TaskState.waiting_on` set is empty), and are waiting for
    an appropriate worker to join the network before computing.

+Once a task is queued up on a worker, it is also tracked on the worker side by the
+:doc:`worker-state`.
+
 Worker State
 ------------

-Each worker's current state is stored in a :class:`WorkerState` object.
+Each worker's current state is stored in a :class:`WorkerState` object; see full API
+through the link.
+
+This is a scheduler-side object, which holds information about what the scheduler
+knows about each worker on the cluster, and is not to be confused with
+:class:`distributed.worker_state_machine.WorkerState`.
+
 This information is involved in deciding
-:ref:`which worker to run a task on <decide-worker>`.
+:ref:`which worker to run a task on <decide-worker>`.

-.. autoclass:: WorkerState
-   :members:
-
 In addition to individual worker state, the scheduler maintains two
 containers to help with scheduling tasks:

@@ -136,13 +151,7 @@ Client State
 ------------

 Information about each individual client of the scheduler is kept
-in a :class:`ClientState` object:
-
-.. autoclass:: ClientState
-   :members:
-
-
-.. XXX list invariants somewhere?
+in a :class:`ClientState` object; see full API through the link.
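+
+As a quick way to see this state in practice, you can inspect the scheduler-side
+containers from a client. The sketch below is illustrative only: it assumes a running
+cluster at a hypothetical address and uses :meth:`~distributed.Client.run_on_scheduler`,
+which injects the scheduler instance as the ``dask_scheduler`` keyword argument:
+
+.. code-block:: python
+
+    from distributed import Client
+
+    client = Client("tcp://127.0.0.1:8786")  # hypothetical scheduler address
+
+    def count_task_states(dask_scheduler):
+        # dask_scheduler.tasks maps key -> scheduler-side TaskState
+        counts = {}
+        for ts in dask_scheduler.tasks.values():
+            counts[ts.state] = counts.get(ts.state, 0) + 1
+        return counts
+
+    client.run_on_scheduler(count_task_states)
+    # e.g. {'memory': 40, 'processing': 8, 'released': 2}
+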
Understanding a Task's Flow @@ -215,6 +224,8 @@ memory → forgotten nbytes :attr:`WorkerState.nbytes`. +.. _scheduling_state_implementation: + Implementation -------------- @@ -224,21 +235,21 @@ name of the start and finish task state like the following. .. code-block:: python - def transition_released_waiting(self, key): + def transition_released_waiting(self, key, stimulus_id): ... - def transition_processing_memory(self, key): + def transition_processing_memory(self, key, stimulus_id): ... - def transition_processing_erred(self, key): + def transition_processing_erred(self, key, stimulus_id): ... These functions each have three effects. 1. They perform the necessary transformations on the scheduler state (the 20 dicts/lists/sets) to move one key between states. 2. They return a dictionary of recommended ``{key: state}`` transitions to - enact directly afterwards on other keys. For example after we transition a - key into memory we may find that many waiting keys are now ready to + enact directly afterwards on other keys. For example, after we transition a + key into memory, we may find that many waiting keys are now ready to transition from waiting to a ready state. -3. Optionally they include a set of validation checks that can be turned on +3. Optionally, they include a set of validation checks that can be turned on for testing. Rather than call these functions directly we call the central function @@ -246,8 +257,7 @@ Rather than call these functions directly we call the central function .. code-block:: python - def transition(self, key, final_state): - """ Transition key to the suggested state """ + def transition(self, key, final_state, stimulus_id): ... This transition function finds the appropriate path from the current to the final state. It also serves as a central point for logging and diagnostics. @@ -258,7 +268,7 @@ steady state. For that we use the ``transitions`` function (note the plural ``s .. code-block:: python - def transitions(self, recommendations): + def transitions(self, recommendations, stimulus_id): recommendations = recommendations.copy() while recommendations: key, finish = recommendations.popitem() @@ -276,17 +286,55 @@ Transitions occur from stimuli, which are state-changing messages to the scheduler from workers or clients. The scheduler responds to the following stimuli: -* **Workers** - * Task finished: A task has completed on a worker and is now in memory - * Task erred: A task ran and erred on a worker - * Task missing data: A task tried to run but was unable to find necessary - data on other workers - * Worker added: A new worker was added to the network - * Worker removed: An existing worker left the network - -* **Clients** - * Update graph: The client sends more tasks to the scheduler - * Release keys: The client no longer desires the result of certain keys +**Workers** + +task-finished + A task has completed on a worker and is now in memory +task-erred + A task ran and erred on a worker +reschedule + A task has completed on a worker by raising :class:`~distributed.Reschedule` +long-running + A task is still running on the worker, but it called :func:`~distributed.secede` +add-keys + Replication finished. One or more tasks, which were previously in memory on other + workers, are now in memory on one additional worker. Also used to inform the + scheduler of a successful :func:`~distributed.Client.scatter` operation. 
+request-refresh-who-has
+    All peers that hold a replica of a task in memory that a worker knows of are
+    unavailable (temporarily or permanently), so the worker can't fetch it and is asking
+    the scheduler if it knows of any additional replicas. This call is repeated
+    periodically until a new replica appears.
+release-worker-data
+    A worker informs the scheduler that it no longer holds the task in memory
+worker-status-change
+    The global status of a worker has just changed, e.g. between ``running`` and
+    ``paused``.
+log-event
+    A generic event happened on the worker, which should be logged centrally.
+    Note that this is in addition to the worker's log, which the client can fetch on
+    request (up to a certain length).
+keep-alive
+    A worker informs the scheduler that it's still online and responsive. This uses the
+    batched stream channel, as opposed to :meth:`distributed.worker.Worker.heartbeat` and
+    :meth:`Scheduler.heartbeat_worker` which use dedicated RPC comms, and is needed to
+    prevent firewalls from closing down the batched stream.
+register-worker
+    A new worker was added to the network
+unregister
+    An existing worker left the network
+
+
+**Clients**
+
+update-graph
+    The client sends more tasks to the scheduler
+client-releases-keys
+    The client no longer desires the result of certain keys.
+
+Note that there are many more client API endpoints (e.g. to serve
+:func:`~distributed.Client.scatter` etc.), which are not listed here for the sake of
+brevity.

 Stimuli functions are prepended with the text ``stimulus``, and take a
 variety of keyword arguments from the message as in the following examples:
@@ -315,6 +363,15 @@ API
    :members:
    :inherited-members:

+.. autoclass:: TaskState
+   :members:
+
+.. autoclass:: WorkerState
+   :members:
+
+.. autoclass:: ClientState
+   :members:
+
 .. autofunction:: decide_worker

 .. autoclass:: MemoryState
diff --git a/docs/source/worker-state.rst b/docs/source/worker-state.rst
new file mode 100644
index 0000000000..a9dce7c26b
--- /dev/null
+++ b/docs/source/worker-state.rst
@@ -0,0 +1,459 @@
+Worker State Machine
+====================
+
+.. currentmodule:: distributed.worker_state_machine
+
+
+Task states
+-----------
+
+When the Scheduler asks a Worker to compute a task, it is tracked by the Worker through
+a :class:`distributed.worker_state_machine.TaskState` object - not to be confused with
+the matching scheduler-side class :class:`distributed.scheduler.TaskState`.
+
+The class has a key attribute, :attr:`TaskState.state`, which can assume the following
+values:
+
+released
+    Known but not actively computing or in memory. A task can stay in this state when
+    the scheduler asked to forget it, but it has dependent tasks on the same worker.
+waiting
+    The scheduler has added the task to the worker queue. All of its dependencies are
+    in memory somewhere on the cluster, but not all of them are in memory on the current
+    worker, so they need to be fetched.
+fetch
+    This task is in memory on one or more peer workers, but not on this worker. Its data
+    is queued to be transferred over the network, either because it's a dependency of a
+    task in ``waiting`` state, or because the :doc:`active_memory_manager` requested it
+    to be replicated here.
+    The task can be found in the :attr:`WorkerState.data_needed` heap.
+missing
+    Like ``fetch``, but all peer workers that were listed by the scheduler are either
+    unreachable or have responded they don't actually have the task data.
+    The worker will periodically ask the scheduler if it knows of additional replicas;
+    when it does, the task will transition again to ``fetch``.
+    The task can be found in the :attr:`WorkerState.missing_dep_flight` set.
+flight
+    The task data is currently being transferred over the network from another worker.
+    The task can be found in the :attr:`WorkerState.in_flight_tasks` and
+    :attr:`WorkerState.in_flight_workers` collections.
+ready
+    The task is ready to be computed; all of its dependencies are in memory on the
+    current worker and it's waiting for an available thread.
+    The task can be found in the :attr:`WorkerState.ready` heap.
+constrained
+    Like ``ready``, but the user specified :doc:`resource constraints <resources>` for
+    this task.
+    The task can be found in the :attr:`WorkerState.constrained` queue.
+executing
+    The task is currently being computed on a thread.
+    It can be found in the :attr:`WorkerState.executing` set and in the
+    :attr:`distributed.worker.Worker.active_threads` dict.
+long-running
+    Like ``executing``, but the user code called :func:`distributed.secede` so the task
+    no longer counts towards the maximum number of concurrent tasks.
+    It can be found in the :attr:`WorkerState.long_running` set and in the
+    :attr:`distributed.worker.Worker.active_threads` dict.
+rescheduled
+    The task just raised the :class:`~distributed.Reschedule` exception. This is a
+    transitory state, which is not stored permanently.
+cancelled
+    The scheduler asked to forget about this task, but it's technically impossible at
+    the moment. See :ref:`cancelled-tasks`. The task can be found in whatever
+    collections it belonged to in its :attr:`~TaskState.previous` state.
+resumed
+    The task was recovered from ``cancelled`` state. See :ref:`cancelled-tasks`.
+    The task can be found in whatever collections it belonged to in its
+    :attr:`~TaskState.previous` state.
+memory
+    Task execution completed, or the task was successfully transferred from another
+    worker, and is now held in either :class:`WorkerState.data` or
+    :class:`WorkerState.actors`.
+error
+    Task execution failed. Alternatively, task execution completed successfully, or the
+    task data transferred successfully over the network, but it failed to serialize or
+    deserialize. The full exception and traceback are stored in the task itself, so that
+    they can be re-raised on the client.
+forgotten
+    The scheduler asked this worker to forget about the task, and there are neither
+    dependents nor dependencies on the same worker. As soon as a task reaches this
+    state, it is immediately dereferenced from the :class:`WorkerState` and will soon
+    be garbage-collected. This is the only case where two instances of a
+    :class:`TaskState` object with the same :attr:`~TaskState.key` can (transitorily)
+    exist in the same interpreter at the same time.
+
+
+Fetching dependencies
+---------------------
+
+.. image:: images/worker-dep-state.svg
+    :alt: Worker states for dependencies
+
+As tasks that need to be computed arrive on the Worker, any dependencies that are not
+already in memory on the same worker are wrapped by :class:`TaskState` objects, each
+containing a listing of workers (:attr:`TaskState.who_has`) to collect their result
+from.
+
+These :class:`TaskState` objects have their state set to ``fetch``, are put in the
+:attr:`~WorkerState.data_needed` heap, and are progressively transferred over the
+network. For each dependency we select a worker at random that has that data and collect
+the dependency from that worker.
+To improve bandwidth, we opportunistically gather other
+dependencies of other tasks that are known to be on that worker, up to a maximum of 50MB
+of data (:attr:`~WorkerState.transfer_message_target_bytes`) - too little data and
+bandwidth suffers, too much data and responsiveness suffers. We use a fixed number of 50
+connections (:attr:`~WorkerState.transfer_incoming_count_limit`, which is in turn
+acquired from the configuration key ``distributed.worker.connections.outgoing``) so as
+to avoid overly-fragmenting our network bandwidth.
+
+In the event that the network comms between two workers are saturated, a dependency task
+may cycle between ``fetch`` and ``flight`` until it is successfully collected. It may
+also happen that a peer worker responds that it doesn't have a replica of the requested
+data anymore; finally, the peer worker may be unreachable or unresponsive. When that
+happens, the peer is removed from :attr:`~TaskState.who_has` and the task is
+transitioned back to ``fetch``, so that the Worker will try gathering the same key from
+a different peer. If :attr:`~TaskState.who_has` becomes empty due to this process, the
+task transitions to ``missing`` and the Worker starts periodically asking the Scheduler
+if additional peers are available.
+
+The same system used for fetching dependencies is also used by
+:doc:`active_memory_manager` replication.
+
+.. note::
+   There is at most one :meth:`~BaseWorker.gather_dep` asyncio task running at any
+   given time for any given peer worker. If all workers holding a replica of a task
+   in ``fetch`` state are already in flight, the task will remain in ``fetch`` state
+   until a worker becomes available again.
+
+
+Computing tasks
+---------------
+A :class:`TaskState` that needs to be computed proceeds on the Worker through the
+following pipeline. It has its :attr:`~TaskState.run_spec` defined, which instructs the
+worker how to execute it.
+
+.. image:: images/worker-execute-state.svg
+    :alt: Worker states for computing tasks
+
+After all dependencies for a task are in memory, the task transitions from ``waiting``
+to ``ready`` or ``constrained`` and is added to the :attr:`~WorkerState.ready` heap.
+
+As soon as a thread is available, we pop a task from the top of the heap and put the
+task into a thread from a local thread pool to execute.
+
+Optionally, while it's running, this task may identify itself as a long-running task
+(see :doc:`Tasks launching tasks <task-launch>`), at which point it secedes from the
+thread pool and changes state to ``long-running``. ``executing`` and ``long-running``
+are almost identical states, the only difference being that the latter doesn't count
+towards the maximum number of tasks running in parallel at the same time.
+
+A task can terminate in three ways:
+
+- Complete successfully; its return value is stored in either :attr:`~WorkerState.data`
+  or :attr:`~WorkerState.actors`
+- Raise an exception; the exception and traceback are stored on the :class:`TaskState`
+  object
+- Raise :class:`~distributed.Reschedule`; it is immediately forgotten.
+
+In all cases, the outcome is sent back to the scheduler.
+
+
+Scattered data
+--------------
+:meth:`Scattered data <distributed.Client.scatter>` follows an even simpler path,
+landing directly in ``memory``:
+
+.. image:: images/worker-scatter-state.svg
+    :alt: Worker states for scattered data
+
+
+Forgetting tasks
+----------------
+Once a task is in ``memory`` or ``error``, the Worker will hold onto it indefinitely,
+until the Scheduler explicitly asks the Worker to forget it.
+This happens when there are no more Clients holding a reference to the key and there are
+no more waiter tasks (that is, dependents that have not been computed). Additionally,
+the :doc:`active_memory_manager` may ask to drop excess replicas of a task.
+
+In the case of ``rescheduled``, the task will instead immediately transition to
+``released`` and then ``forgotten`` without waiting for the scheduler.
+
+.. image:: images/worker-forget-state.svg
+    :alt: Worker states for forgetting tasks
+
+
+Irregular flow
+--------------
+There are a few important exceptions to the flow diagrams above:
+
+- A task is :doc:`stolen <work-stealing>`, in which case it transitions from
+  ``waiting``, ``ready``, or ``constrained`` directly to ``released``. Note that steal
+  requests for tasks that are currently executing are rejected.
+- Scheduler intercession, in which the scheduler reassigns a task that was
+  previously assigned to a separate worker to a new worker. This most commonly
+  occurs when a :doc:`worker dies <killed>` during computation.
+- Client intercession, where a client either explicitly releases a Future or descopes
+  it; alternatively the whole client may shut down or become unresponsive. When there
+  are no more clients holding references to a key or one of its dependents, the
+  Scheduler will release it.
+
+In short:
+
+.. important::
+   A task can transition to ``released`` from *any* state, not just those in the
+   diagrams above.
+
+If there are no dependents, the task immediately transitions to ``forgotten`` and is
+descoped. However, there is an important exception, :ref:`cancelled-tasks`.
+
+
+.. _cancelled-tasks:
+
+Task cancellation
+-----------------
+The Worker may receive a request to release a key while it is currently in ``flight``,
+``executing``, or ``long-running``. Due to technical limitations around cancelling
+Python threads, and the way data fetching from peer workers is currently implemented,
+such an event cannot cause the related asyncio task (and, in the case of ``executing`` /
+``long-running``, the thread running the user code) to be immediately aborted. Instead,
+tasks in these three states are transitioned to another state, ``cancelled``, which
+means that the asyncio task will proceed to completion (outcome is irrelevant) and only
+*then* will the Dask task be released.
+
+The ``cancelled`` state has a substate, :attr:`~TaskState.previous`, which is set to one
+of the above three states. The common notation for this is ``cancelled(<previous>)``,
+e.g. ``cancelled(flight)``.
+
+While a task is cancelled, one of three things will happen:
+
+- Nothing happens before the asyncio task completes; e.g. the Scheduler does not change
+  its mind and still wants the Worker to forget about the task until the very end.
+  When that happens, the task transitions from ``cancelled`` to ``released`` and,
+  typically, ``forgotten``.
+- The scheduler switches back to its original request:
+
+  - The scheduler asks the Worker to fetch a task that is currently
+    ``cancelled(flight)``; at which point the task will immediately revert to
+    ``flight``, forget that cancellation ever happened, and continue waiting on the data
+    fetch that's already running;
+  - The scheduler asks the Worker to compute a task that is currently
+    ``cancelled(executing)`` or ``cancelled(long-running)``. The Worker will completely
+    disregard the new :attr:`~TaskState.run_spec` (if it changed), switch back to the
+    :attr:`~TaskState.previous` state, and wait for the already executing thread to
+    finish.
+
+- The scheduler flips to the opposite request, from fetch to computation or the other
+  way around.
+
+To serve this last use case there is another special state, ``resumed``. A task can
+enter ``resumed`` state exclusively from ``cancelled``. ``resumed`` retains the
+:attr:`~TaskState.previous` attribute from the ``cancelled`` state and adds another
+attribute, :attr:`~TaskState.next`, which is always:
+
+- ``fetch``, if :attr:`~TaskState.previous` is ``executing`` or ``long-running``
+- ``waiting``, if :attr:`~TaskState.previous` is ``flight``
+
+To recap, these are all possible permutations of states and substates to handle
+cancelled tasks:
+
+========= ============ =======
+state     previous     next
+========= ============ =======
+cancelled flight       None
+cancelled executing    None
+cancelled long-running None
+resumed   flight       waiting
+resumed   executing    fetch
+resumed   long-running fetch
+========= ============ =======
+
+If a ``resumed`` task completes successfully, it will transition to ``memory`` (as
+opposed to a ``cancelled`` task, where the output is disregarded) and the Scheduler
+will be informed with a spoofed termination message, that is the expected end message
+for ``flight`` if the task is ``resumed(executing->fetch)`` or
+``resumed(long-running->fetch)``, and the expected end message for ``execute`` if
+the task is ``resumed(flight->waiting)``.
+
+If the task fails or raises :class:`~distributed.Reschedule`, the Worker will instead
+silently ignore the exception and switch to its intended course, so
+``resumed(executing->fetch)`` or ``resumed(long-running->fetch)`` will transition to
+``fetch`` and ``resumed(flight->waiting)`` will transition to ``waiting``.
+
+Finally, the scheduler can change its mind multiple times over the lifetime of the task,
+so a ``resumed(executing->fetch)`` or ``resumed(long-running->fetch)`` task may be
+requested to transition to ``waiting`` again, at which point it will just revert to its
+:attr:`~TaskState.previous` state and forget the whole incident; likewise a
+``resumed(flight->waiting)`` task could be requested to transition to ``fetch`` again,
+so it will just transition to ``flight`` instead.
+
+.. image:: images/worker-cancel-state1.svg
+    :alt: Worker states for cancel/resume
+
+.. image:: images/worker-cancel-state2.svg
+    :alt: Worker states for cancel/resume
+
+
+**A common real-life use case**
+
+1. There are at least two workers on the cluster, A and B.
+2. Task x is computed successfully on worker A.
+3. When task x transitions to memory on worker A, the scheduler asks worker B to compute
+   task y, which depends on task x.
+4. B starts acquiring the key x from A, which sends the task into ``flight`` mode.
+5. Worker A crashes, and for whatever reason the scheduler notices before worker B does.
+6. The scheduler will release task y (because it's waiting on dependencies that are
+   nowhere to be found in memory anymore) and reschedule task x somewhere else on the
+   cluster. Task x will transition to ``cancelled(flight)`` on worker B.
+7. If the scheduler randomly chooses worker B to compute task x, the task will
+   transition to ``resumed(flight->waiting)``.
+8. When, *and only when*, the TCP socket from B to A collapses (e.g. due to timeout),
+   the task will transition to ``waiting`` and will be eventually recomputed on B.
+
+.. important::
+
+   You always have *at most* one :meth:`~BaseWorker.execute` or
+   :meth:`~BaseWorker.gather_dep` asyncio task running for any one given key; you
+   never have both.
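+
+The permutation table above is small enough to encode directly. The snippet below is
+purely illustrative - it is not code from ``distributed`` - and simply restates the
+table as a lookup from the ``state`` / ``previous`` pair to the ``next`` substate:
+
+.. code-block:: python
+
+    # Illustrative only: the valid (state, previous) -> next permutations,
+    # transcribed from the table above.
+    PERMUTATIONS = {
+        ("cancelled", "flight"): None,
+        ("cancelled", "executing"): None,
+        ("cancelled", "long-running"): None,
+        ("resumed", "flight"): "waiting",
+        ("resumed", "executing"): "fetch",
+        ("resumed", "long-running"): "fetch",
+    }
+
+    def next_substate(state, previous):
+        """TaskState.next for a cancelled or resumed task, per the table above"""
+        return PERMUTATIONS[state, previous]
+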
+
+
+Task state mapping between Scheduler and Worker
+-----------------------------------------------
+
+The task states on the scheduler and the worker are different, and their mapping is
+somewhat nuanced:
+
++------------------+-----------------------+-------------------------+
+| Scheduler states | Typical worker states | Edge case worker states |
++==================+=======================+=========================+
+| - released       | - (unknown)           | - released              |
+| - waiting        |                       | - cancelled             |
+| - no-worker      |                       |                         |
++------------------+-----------------------+-------------------------+
+| - processing     | - waiting             | - resumed(waiting)      |
+|                  | - ready               |                         |
+|                  | - constrained         |                         |
+|                  | - executing           |                         |
+|                  | - long-running        |                         |
++------------------+-----------------------+-------------------------+
+| - memory         | - memory              | - error                 |
+|                  | - fetch               | - missing               |
+|                  | - flight              | - resumed(fetch)        |
++------------------+-----------------------+-------------------------+
+| - erred          | - error               |                         |
++------------------+-----------------------+-------------------------+
+
+In addition to the above states, a worker may not know about a specific task at all.
+The opposite, where the worker knows about a task but it is nowhere to be found on the
+scheduler, happens exclusively in the case of :ref:`cancelled-tasks`.
+
+There are also *race conditions* to be considered, where a worker (or some workers) know
+something before the scheduler does, or the other way around. For example,
+
+- A task will always transition from ``executing`` to ``memory`` on the worker before
+  it can transition from ``processing`` to ``memory`` on the scheduler
+- A task will always transition to ``released`` or ``forgotten`` on the scheduler
+  first; only when the message reaches the worker will it be released there too.
+
+
+Flow control
+------------
+.. image:: images/worker-state-machine.svg
+    :alt: Worker state machine control flow
+
+There are several classes involved in the worker state machine:
+
+:class:`TaskState` includes all the information related to a single task; it also
+includes references to dependent and dependency tasks. This is just a data holder, with
+no mutating methods. Note that this is a distinct class from
+:class:`distributed.scheduler.TaskState`.
+
+:class:`WorkerState` encapsulates the state of the worker as a whole. It holds
+references to :class:`TaskState` in its :attr:`~WorkerState.tasks` dictionary and in
+several other secondary collections. Crucially, this class has no knowledge or
+visibility whatsoever on asyncio, networking, disk I/O, threads, etc.
+Note that this is a distinct class from :class:`distributed.scheduler.WorkerState`.
+
+:class:`WorkerState` offers a single method to mutate the state:
+:meth:`~WorkerState.handle_stimulus`. The state must not be altered in any other way.
+The method accepts a :class:`StateMachineEvent`, a.k.a. *stimulus*, which is a data
+class describing something that happened which may cause the worker state to mutate.
+A stimulus can arrive from either the scheduler (e.g. a request to compute a task) or
+from the worker itself (e.g. a task has finished computing).
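+
+The toy sketch below is deliberately simplified and is *not* the actual
+``distributed`` API; it only illustrates the shape of this design: a pure state
+container whose single mutating method consumes an event and returns a list of
+instructions, which are described next:
+
+.. code-block:: python
+
+    from dataclasses import dataclass
+
+
+    @dataclass
+    class ToyEvent:
+        """Something that happened, e.g. 'please compute task x'"""
+        stimulus_id: str
+
+
+    @dataclass
+    class ToyInstruction:
+        """A side effect the caller must perform (I/O, compute, messaging)"""
+        stimulus_id: str
+
+
+    class ToyWorkerState:
+        """Pure state machine: no asyncio, networking, threads, or disk I/O"""
+
+        def __init__(self):
+            self.tasks = {}  # key -> state
+
+        def handle_stimulus(self, event: ToyEvent) -> list:
+            # Mutate the internal state here, then tell the caller which side
+            # effects to perform; never perform them directly.
+            return [ToyInstruction(stimulus_id=event.stimulus_id)]
+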
+
+:meth:`WorkerState.handle_stimulus` alters the internal state (e.g., it could transition
+a task from ``executing`` to ``memory``) and returns a list of :class:`Instruction`
+objects, which are actions that the worker needs to take but are external to the state
+itself:
+
+- send a message to the scheduler
+- compute a task
+- gather a task from a peer worker
+
+:meth:`WorkerState.handle_stimulus` is wrapped by :meth:`BaseWorker.handle_stimulus`,
+which consumes the :class:`Instruction` objects. :class:`BaseWorker` deals with asyncio
+task creation, tracking, and cleanup, but does not implement the actual task execution
+or gathering; instead it exposes the abstract async methods
+:meth:`~BaseWorker.execute` and :meth:`~BaseWorker.gather_dep`, which are then
+overridden by its subclass :class:`~distributed.Worker`, which actually runs tasks and
+performs network I/O. When the implemented methods finish, they must return a
+:class:`StateMachineEvent`, which is fed back into :meth:`BaseWorker.handle_stimulus`.
+
+.. note::
+   This can create a (potentially very long) chain of events internal to the worker;
+   e.g. if there are more tasks in the :attr:`~WorkerState.ready` queue than there are
+   threads, then the termination :class:`StateMachineEvent` of one task will trigger the
+   :class:`Instruction` to execute the next one.
+
+To summarize:
+
+- :class:`WorkerState` is agnostic to asyncio, networking, threading, and disk I/O; it
+  includes collections of :class:`TaskState` objects.
+- :class:`BaseWorker` encapsulates :class:`WorkerState` and adds awareness of asyncio.
+- :class:`~distributed.Worker` subclasses :class:`BaseWorker` and adds awareness of
+  networking, threading, and disk I/O.
+
+
+Internal state permutation
+--------------------------
+Internally, :meth:`WorkerState.handle_stimulus` works very similarly to
+:ref:`the same process on the scheduler side <scheduling_state_implementation>`:
+
+#. :meth:`WorkerState.handle_stimulus` calls ``WorkerState._handle_<event name>()``,
+#. which returns a tuple of
+
+   - *recommendations* to transition tasks: {:class:`TaskState`: <new state>}
+   - list of :class:`Instruction` objects
+
+#. :meth:`WorkerState.handle_stimulus` then passes the recommendations to
+   :meth:`WorkerState._transitions`
+#. For each recommendation, :meth:`WorkerState._transitions` calls
+   :meth:`WorkerState._transition`,
+#. which in turn calls ``WorkerState._transition_<start state>_<end state>()``,
+#. which in turn returns an additional tuple of (recommendations, instructions)
+#. the new recommendations are consumed by :meth:`WorkerState._transitions`, until no
+   more recommendations are returned.
+#. :meth:`WorkerState.handle_stimulus` finally returns the list of instructions, which
+   has been progressively extended by the transitions.
+
+
+API Documentation
+-----------------
+
+.. autoclass:: TaskState
+   :members:
+
+.. autoclass:: WorkerState
+   :members:
+
+.. autoclass:: BaseWorker
+   :members:
+
+.. autoclass:: StateMachineEvent
+   :members:
+
+.. autoclass:: Instruction
+   :members:
+
+.. note::
+   :class:`StateMachineEvent` and :class:`Instruction` are abstract classes, with many
+   subclasses which are not listed here for the sake of brevity.
+   Refer to the implementation module :mod:`distributed.worker_state_machine` for the
+   full list.
diff --git a/docs/source/worker.rst b/docs/source/worker.rst index b3d9f8c0cb..9042e24191 100644 --- a/docs/source/worker.rst +++ b/docs/source/worker.rst @@ -93,58 +93,13 @@ more details on the command line options, please have a look at the Internal Scheduling ------------------- +See dedicated page: :doc:`worker-state` -Internally tasks that come to the scheduler proceed through the following pipeline as -:class:`distributed.worker_state_machine.TaskState` objects. Tasks which follow this -path have a :attr:`~distributed.worker_state_machine.TaskState.runspec` defined which -instructs the worker how to execute them. -.. image:: images/worker-task-state.svg - :alt: Dask worker task states - -Data dependencies are also represented as -:class:`~distributed.worker_state_machine.TaskState` objects and follow a simpler path -through the execution pipeline. These tasks do not have a -:attr:`~distributed.worker_state_machine.TaskState.runspec` defined and instead contain -a listing of workers to collect their result from. - - -.. image:: images/worker-dep-state.svg - :alt: Dask worker dependency states - -As tasks arrive they are prioritized and put into a heap. They are then taken -from this heap in turn to have any remote dependencies collected. For each -dependency we select a worker at random that has that data and collect the -dependency from that worker. To improve bandwidth we opportunistically gather -other dependencies of other tasks that are known to be on that worker, up to a -maximum of 200MB of data (too little data and bandwidth suffers, too much data -and responsiveness suffers). We use a fixed number of connections (around -10-50) so as to avoid overly-fragmenting our network bandwidth. In the event -that the network comms between two workers are saturated, a dependency task may -cycle between ``fetch`` and ``flight`` until it is successfully collected. - -After all dependencies for a task are in memory we transition the task to the -ready state and put the task again into a heap of tasks that are ready to run. - -We collect from this heap and put the task into a thread from a local thread -pool to execute. - -Optionally, this task may identify itself as a long-running task (see -:doc:`Tasks launching tasks `), at which point it secedes from the -thread pool. - -A task either errs or its result is put into memory. In either case a response -is sent back to the scheduler. - -Tasks slated for execution and tasks marked for collection from other workers -must follow their respective transition paths as defined above. The only -exceptions to this are when: - -* A task is `stolen `_, in which case a task which might have - been collected will instead be executed on the thieving worker -* Scheduler intercession, in which the scheduler reassigns a task that was - previously assigned to a separate worker to a new worker. This most commonly - occurs when a `worker dies `_ during computation. +API Documentation +----------------- +.. autoclass:: distributed.worker.Worker + :members: .. _nanny: @@ -157,23 +112,3 @@ process. .. autoclass:: distributed.nanny.Nanny :members: - - -API Documentation ------------------ - -.. currentmodule:: distributed.worker_state_machine - -.. autoclass:: distributed.worker_state_machine.TaskState - :members: - -.. autoclass:: distributed.worker_state_machine.WorkerState - :members: - -.. autoclass:: distributed.worker_state_machine.BaseWorker - :members: - -.. currentmodule:: distributed.worker - -.. autoclass:: distributed.worker.Worker - :members: