Diagnostics documentation (#540)

tomwhite · web-flow · commit bdf6dba80ecb · 2024-08-07T10:30:47.000+01:00
diff --git a/docs/images/cubed-add.svg b/docs/images/cubed-add.svg
@@ -0,0 +1,132 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN"
+ "http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
+<!-- Generated by graphviz version 10.0.1 (20240210.2158)
+ -->
+<!-- Pages: 1 -->
+<svg width="230pt" height="319pt"
+ viewBox="0.00 0.00 229.75 318.75" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink">
+<g id="graph0" class="graph" transform="scale(1 1) rotate(0) translate(4 314.75)">
+<polygon fill="white" stroke="none" points="-4,4 -4,-314.75 225.75,-314.75 225.75,4 -4,4"/>
+<text text-anchor="start" x="8" y="-39.5" font-family="Times,serif" font-size="10.00">num tasks: 5</text>
+<text text-anchor="start" x="8" y="-28.25" font-family="Times,serif" font-size="10.00">max projected memory: 100.0 MB</text>
+<text text-anchor="start" x="8" y="-17" font-family="Times,serif" font-size="10.00">total nbytes written: 72 bytes</text>
+<text text-anchor="start" x="8" y="-5.75" font-family="Times,serif" font-size="10.00">optimized: True</text>
+<!-- op&#45;001 -->
+<g id="node1" class="node">
+<title>op&#45;001</title>
+<g id="a_node1"><a xlink:title="name: op&#45;001&#10;op: asarray&#10;calls: &lt;module&gt; &#45;&gt; asarray&#10;line: 1 in &lt;module&gt;">
+<path fill="none" stroke="black" d="M43.25,-310.75C43.25,-310.75 13.25,-310.75 13.25,-310.75 7.25,-310.75 1.25,-304.75 1.25,-298.75 1.25,-298.75 1.25,-286.75 1.25,-286.75 1.25,-280.75 7.25,-274.75 13.25,-274.75 13.25,-274.75 43.25,-274.75 43.25,-274.75 49.25,-274.75 55.25,-280.75 55.25,-286.75 55.25,-286.75 55.25,-298.75 55.25,-298.75 55.25,-304.75 49.25,-310.75 43.25,-310.75"/>
+<text text-anchor="middle" x="28.25" y="-294.5" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;001</text>
+<text text-anchor="middle" x="28.25" y="-283.25" font-family="Helvetica,sans-Serif" font-size="10.00">asarray</text>
+</a>
+</g>
+</g>
+<!-- array&#45;001 -->
+<g id="node2" class="node">
+<title>array&#45;001</title>
+<g id="a_node2"><a xlink:title="name: array&#45;001&#10;variable: a&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: int64&#10;chunk memory: 32 bytes">
+<polygon fill="none" stroke="black" points="56.5,-238.75 0,-238.75 0,-202.75 56.5,-202.75 56.5,-238.75"/>
+<text text-anchor="middle" x="28.25" y="-222.5" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;001</text>
+<text text-anchor="middle" x="28.25" y="-211.25" font-family="Helvetica,sans-Serif" font-size="10.00">a</text>
+</a>
+</g>
+</g>
+<!-- op&#45;001&#45;&gt;array&#45;001 -->
+<g id="edge1" class="edge">
+<title>op&#45;001&#45;&gt;array&#45;001</title>
+<path fill="none" stroke="black" d="M28.25,-274.45C28.25,-267.16 28.25,-258.48 28.25,-250.29"/>
+<polygon fill="black" stroke="black" points="31.75,-250.37 28.25,-240.37 24.75,-250.37 31.75,-250.37"/>
+</g>
+<!-- op&#45;003 -->
+<g id="node5" class="node">
+<title>op&#45;003</title>
+<g id="a_node5"><a xlink:title="name: op&#45;003&#10;op: blockwise&#10;projected memory: 100.0 MB&#10;tasks: 4&#10;num input blocks: (1, 1)&#10;calls: &lt;module&gt; &#45;&gt; add &#45;&gt; elemwise &#45;&gt; blockwise&#10;line: 1 in &lt;module&gt;">
+<path fill="#dcbeff" stroke="black" d="M80.25,-166.75C80.25,-166.75 50.25,-166.75 50.25,-166.75 44.25,-166.75 38.25,-160.75 38.25,-154.75 38.25,-154.75 38.25,-137 38.25,-137 38.25,-131 44.25,-125 50.25,-125 50.25,-125 80.25,-125 80.25,-125 86.25,-125 92.25,-131 92.25,-137 92.25,-137 92.25,-154.75 92.25,-154.75 92.25,-160.75 86.25,-166.75 80.25,-166.75"/>
+<text text-anchor="middle" x="65.25" y="-153.25" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;003</text>
+<text text-anchor="middle" x="65.25" y="-142" font-family="Helvetica,sans-Serif" font-size="10.00">add</text>
+<text text-anchor="middle" x="65.25" y="-130.75" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 4</text>
+</a>
+</g>
+</g>
+<!-- array&#45;001&#45;&gt;op&#45;003 -->
+<g id="edge2" class="edge">
+<title>array&#45;001&#45;&gt;op&#45;003</title>
+<path fill="none" stroke="black" d="M37.02,-202.48C40.85,-194.94 45.45,-185.87 49.82,-177.26"/>
+<polygon fill="black" stroke="black" points="52.88,-178.97 54.28,-168.47 46.64,-175.8 52.88,-178.97"/>
+</g>
+<!-- op&#45;002 -->
+<g id="node3" class="node">
+<title>op&#45;002</title>
+<g id="a_node3"><a xlink:title="name: op&#45;002&#10;op: asarray&#10;calls: &lt;module&gt; &#45;&gt; asarray&#10;line: 1 in &lt;module&gt;">
+<path fill="none" stroke="black" d="M118.25,-310.75C118.25,-310.75 88.25,-310.75 88.25,-310.75 82.25,-310.75 76.25,-304.75 76.25,-298.75 76.25,-298.75 76.25,-286.75 76.25,-286.75 76.25,-280.75 82.25,-274.75 88.25,-274.75 88.25,-274.75 118.25,-274.75 118.25,-274.75 124.25,-274.75 130.25,-280.75 130.25,-286.75 130.25,-286.75 130.25,-298.75 130.25,-298.75 130.25,-304.75 124.25,-310.75 118.25,-310.75"/>
+<text text-anchor="middle" x="103.25" y="-294.5" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;002</text>
+<text text-anchor="middle" x="103.25" y="-283.25" font-family="Helvetica,sans-Serif" font-size="10.00">asarray</text>
+</a>
+</g>
+</g>
+<!-- array&#45;002 -->
+<g id="node4" class="node">
+<title>array&#45;002</title>
+<g id="a_node4"><a xlink:title="name: array&#45;002&#10;variable: b&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: int64&#10;chunk memory: 32 bytes">
+<polygon fill="none" stroke="black" points="131.5,-238.75 75,-238.75 75,-202.75 131.5,-202.75 131.5,-238.75"/>
+<text text-anchor="middle" x="103.25" y="-222.5" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;002</text>
+<text text-anchor="middle" x="103.25" y="-211.25" font-family="Helvetica,sans-Serif" font-size="10.00">b</text>
+</a>
+</g>
+</g>
+<!-- op&#45;002&#45;&gt;array&#45;002 -->
+<g id="edge3" class="edge">
+<title>op&#45;002&#45;&gt;array&#45;002</title>
+<path fill="none" stroke="black" d="M103.25,-274.45C103.25,-267.16 103.25,-258.48 103.25,-250.29"/>
+<polygon fill="black" stroke="black" points="106.75,-250.37 103.25,-240.37 99.75,-250.37 106.75,-250.37"/>
+</g>
+<!-- array&#45;002&#45;&gt;op&#45;003 -->
+<g id="edge4" class="edge">
+<title>array&#45;002&#45;&gt;op&#45;003</title>
+<path fill="none" stroke="black" d="M94.24,-202.48C90.31,-194.94 85.58,-185.87 81.09,-177.26"/>
+<polygon fill="black" stroke="black" points="84.24,-175.71 76.51,-168.47 78.03,-178.95 84.24,-175.71"/>
+</g>
+<!-- array&#45;003 -->
+<g id="node6" class="node">
+<title>array&#45;003</title>
+<g id="a_node6"><a xlink:title="name: array&#45;003&#10;variable: c&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: int64&#10;chunk memory: 32 bytes&#10;nbytes: 72 bytes">
+<polygon fill="#ffd8b1" stroke="black" points="93.5,-89 37,-89 37,-53 93.5,-53 93.5,-89"/>
+<text text-anchor="middle" x="65.25" y="-72.75" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;003</text>
+<text text-anchor="middle" x="65.25" y="-61.5" font-family="Helvetica,sans-Serif" font-size="10.00">c</text>
+</a>
+</g>
+</g>
+<!-- op&#45;003&#45;&gt;array&#45;003 -->
+<g id="edge5" class="edge">
+<title>op&#45;003&#45;&gt;array&#45;003</title>
+<path fill="none" stroke="black" d="M65.25,-124.58C65.25,-117.19 65.25,-108.7 65.25,-100.73"/>
+<polygon fill="black" stroke="black" points="68.75,-100.74 65.25,-90.74 61.75,-100.74 68.75,-100.74"/>
+</g>
+<!-- create&#45;arrays -->
+<g id="node7" class="node">
+<title>create&#45;arrays</title>
+<g id="a_node7"><a xlink:title="name: create&#45;arrays&#10;op: create&#45;arrays&#10;projected memory: 100.0 MB&#10;tasks: 1">
+<path fill="none" stroke="black" d="M209.75,-310.75C209.75,-310.75 160.75,-310.75 160.75,-310.75 154.75,-310.75 148.75,-304.75 148.75,-298.75 148.75,-298.75 148.75,-286.75 148.75,-286.75 148.75,-280.75 154.75,-274.75 160.75,-274.75 160.75,-274.75 209.75,-274.75 209.75,-274.75 215.75,-274.75 221.75,-280.75 221.75,-286.75 221.75,-286.75 221.75,-298.75 221.75,-298.75 221.75,-304.75 215.75,-310.75 209.75,-310.75"/>
+<text text-anchor="middle" x="185.25" y="-294.5" font-family="Helvetica,sans-Serif" font-size="10.00">create&#45;arrays</text>
+<text text-anchor="middle" x="185.25" y="-283.25" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 1</text>
+</a>
+</g>
+</g>
+<!-- arrays -->
+<g id="node8" class="node">
+<title>arrays</title>
+<g id="a_node8"><a xlink:title="name: arrays">
+<polygon fill="none" stroke="black" points="212.25,-238.75 158.25,-238.75 158.25,-202.75 212.25,-202.75 212.25,-238.75"/>
+<text text-anchor="middle" x="185.25" y="-216.88" font-family="Helvetica,sans-Serif" font-size="10.00">arrays</text>
+</a>
+</g>
+</g>
+<!-- create&#45;arrays&#45;&gt;arrays -->
+<g id="edge6" class="edge">
+<title>create&#45;arrays&#45;&gt;arrays</title>
+<path fill="none" stroke="black" d="M185.25,-274.45C185.25,-267.16 185.25,-258.48 185.25,-250.29"/>
+<polygon fill="black" stroke="black" points="188.75,-250.37 185.25,-240.37 181.75,-250.37 188.75,-250.37"/>
+</g>
+</g>
+</svg>
diff --git a/docs/user-guide/diagnostics.md b/docs/user-guide/diagnostics.md
@@ -0,0 +1,66 @@
+# Diagnostics
+
+Cubed provides a variety of tools to understand a computation before running it, to monitor its progress while running, and to view performance statistics after it has completed.
+
+To use these features, ensure that the optional dependencies for diagnostics have been installed:
+
+```shell
+python -m pip install "cubed[diagnostics]"
+```
+
+## Visualize the computation plan
+
+Before running a computation, Cubed will create an internal plan that it uses to compute the output arrays.
+
+The plan is a directed acyclic graph (DAG), and it can be useful to visualize it to see the number of steps involved in your computation, the number of tasks in each step (and overall), and the amount of intermediate data written out.
+
+The {py:meth}`Array.visualize() <cubed.Array.visualize()>` method on an array creates an image of the DAG. By default it is saved in a file called *cubed.svg* in the current working directory, but the filename and format can be changed if needed. If running in a Jupyter notebook the image will be rendered in the notebook.
+
+If you are computing multiple arrays at once, then there is a {py:func}`visualize <cubed.visualize>` function that takes multiple array arguments.
+
+This example shows a tiny computation and the resulting plan:
+
+```python
+import cubed.array_api as xp
+import cubed.random
+
+a = xp.asarray([[1, 2, 3], [4, 5, 6], [7, 8, 9]], chunks=(2, 2))
+b = xp.asarray([[1, 2, 3], [4, 5, 6], [7, 8, 9]], chunks=(2, 2))
+c = xp.add(a, b)
+
+c.visualize()
+```
+
+![Cubed visualization of a tiny computation](../images/cubed-add.svg)
+
+There are two types of nodes in the plan. Boxes with rounded corners are operations, while boxes with square corners are arrays.
+
+In this case there are three operations (labelled `op-001`, `op-002`, and `op-003`), which produce the three arrays `a`, `b`, and `c`. (There is always an additional operation called `create-arrays`, shown on the right, which Cubed creates automatically.)
+
+Array `c` is coloured orange, which means it is materialized as a Zarr array. Arrays `a` and `b` do not need to be materialized as Zarr arrays since they are small constant arrays that are passed to the workers running the tasks.
+
+Similarly, the operation that produces `c` is shown in a lilac colour to signify that it runs tasks to produce the output. Operations `op-001` and `op-002` don't run any tasks since `a` and `b` are just small constant arrays.
+
+## Progress bar
+
+You can display a progress bar to track your computation by passing callbacks to {py:meth}`compute() <cubed.Array.compute()>`:
+
+```ipython
+>>> from cubed.diagnostics.rich import RichProgressBar
+>>> progress = RichProgressBar()
+>>> c.compute(callbacks=[progress])  # c is the array from above
+  create-arrays 1/1 ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 100.0% 0:00:00
+  op-003 add    4/4 ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 100.0% 0:00:00
+```
+
+This works in Jupyter notebooks and with all executors.
+
+You can also pass callbacks to functions that call `compute`, such as {py:func}`store <cubed.store>` or {py:func}`to_zarr <cubed.to_zarr>`.
+
+## History and timeline visualization
+
+The history and timeline visualization callbacks can be used to find out how long tasks took to run, and how much memory they used.
+
+The timeline visualization is useful to determine how much time was spent in worker startup, as well as how much stragglers affected the overall time of the computation. (Ideally, we want vertical lines on this plot, which would represent perfect horizontal scaling.)
+
+See the [examples](https://github.com/cubed-dev/cubed/blob/main/examples/README.md) for more information about how to use them.
diff --git a/docs/user-guide/index.md b/docs/user-guide/index.md
@@ -11,4 +11,5 @@ storage
 memory
 reliability
 scaling
+diagnostics
 ```
diff --git a/docs/user-guide/scaling.md b/docs/user-guide/scaling.md
@@ -78,20 +78,7 @@ Different cloud providers' serverless offerings may perform differently. For exa
 
 ## Diagnosing Performance
 
-To understand how your computation could perform better you first need to diagnose the source of any problems.
-
-### Optimized Plan
-
-Use {py:meth}`Plan.visualize() <cubed.Plan.visualize()>` to view the optimized plan. This allows you to see the number of steps involved in your calculation, the number of tasks in each step, and overall.
-
-### History Callback
-
-The history callback function can help determine how much time was spent in worker startup, as well as how much stragglers affected the overall speed.
-
-### Timeline Visualization Callback
-
-A timeline visualization callback can provide a visual representation of the above points. Ideally, we want vertical lines on this plot, which would represent perfect horizontal scaling.
-
+See <project:diagnostics.md>.
 
 ## Tips