diff --git a/docs/images/optimization_map_fusion.svg b/docs/images/optimization_map_fusion.svg
new file mode 100644
index 00000000..fb8a03db
--- /dev/null
+++ b/docs/images/optimization_map_fusion.svg
@@ -0,0 +1,100 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN"
+ "http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
+<!-- Generated by graphviz version 2.49.3 (20211023.0002)
+ -->
+<!-- Pages: 1 -->
+<svg width="163pt" height="317pt"
+ viewBox="0.00 0.00 163.00 317.00" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink">
+<g id="graph0" class="graph" transform="scale(1 1) rotate(0) translate(4 313)">
+<polygon fill="white" stroke="none" points="-4,4 -4,-313 159,-313 159,4 -4,4"/>
+<text text-anchor="start" x="8" y="-40" font-family="Times,serif" font-size="10.00">num tasks: 5</text>
+<text text-anchor="start" x="8" y="-29" font-family="Times,serif" font-size="10.00">max projected memory: 100.0 MB</text>
+<text text-anchor="start" x="8" y="-18" font-family="Times,serif" font-size="10.00">total nbytes: 36 bytes</text>
+<text text-anchor="start" x="8" y="-7" font-family="Times,serif" font-size="10.00">optimized: True</text>
+<!-- op&#45;001 -->
+<g id="node1" class="node">
+<title>op&#45;001</title>
+<g id="a_node1"><a xlink:title="name: op&#45;001&#10;op: asarray&#10;calls: &lt;module&gt; &#45;&gt; asarray&#10;line: 1 in &lt;module&gt;">
+<path fill="none" stroke="black" d="M47,-309C47,-309 17,-309 17,-309 11,-309 5,-303 5,-297 5,-297 5,-285 5,-285 5,-279 11,-273 17,-273 17,-273 47,-273 47,-273 53,-273 59,-279 59,-285 59,-285 59,-297 59,-297 59,-303 53,-309 47,-309"/>
+<text text-anchor="middle" x="32" y="-294" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;001</text>
+<text text-anchor="middle" x="32" y="-283" font-family="Helvetica,sans-Serif" font-size="10.00">asarray</text>
+</a>
+</g>
+</g>
+<!-- array&#45;001 -->
+<g id="node2" class="node">
+<title>array&#45;001</title>
+<g id="a_node2"><a xlink:title="name: array&#45;001&#10;variable: a&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: int64&#10;chunk memory: 32 bytes">
+<polygon fill="none" stroke="black" points="61.5,-237 2.5,-237 2.5,-201 61.5,-201 61.5,-237"/>
+<text text-anchor="middle" x="32" y="-222" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;001</text>
+<text text-anchor="middle" x="32" y="-211" font-family="Helvetica,sans-Serif" font-size="10.00">a</text>
+</a>
+</g>
+</g>
+<!-- op&#45;001&#45;&gt;array&#45;001 -->
+<g id="edge1" class="edge">
+<title>op&#45;001&#45;&gt;array&#45;001</title>
+<path fill="none" stroke="black" d="M32,-272.7C32,-264.98 32,-255.71 32,-247.11"/>
+<polygon fill="black" stroke="black" points="35.5,-247.1 32,-237.1 28.5,-247.1 35.5,-247.1"/>
+</g>
+<!-- op&#45;003 -->
+<g id="node3" class="node">
+<title>op&#45;003</title>
+<g id="a_node3"><a xlink:title="name: op&#45;003&#10;op: blockwise&#10;projected memory: 100.0 MB&#10;tasks: 4&#10;num input blocks: (1,)&#10;calls: &lt;module&gt; &#45;&gt; astype &#45;&gt; map_blocks &#45;&gt; _map_blocks &#45;&gt; blockwise&#10;line: 1 in &lt;module&gt;">
+<path fill="#dcbeff" stroke="black" d="M47,-165C47,-165 17,-165 17,-165 11,-165 5,-159 5,-153 5,-153 5,-136 5,-136 5,-130 11,-124 17,-124 17,-124 47,-124 47,-124 53,-124 59,-130 59,-136 59,-136 59,-153 59,-153 59,-159 53,-165 47,-165"/>
+<text text-anchor="middle" x="32" y="-153" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;003</text>
+<text text-anchor="middle" x="32" y="-142" font-family="Helvetica,sans-Serif" font-size="10.00">astype</text>
+<text text-anchor="middle" x="32" y="-131" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 4</text>
+</a>
+</g>
+</g>
+<!-- array&#45;001&#45;&gt;op&#45;003 -->
+<g id="edge2" class="edge">
+<title>array&#45;001&#45;&gt;op&#45;003</title>
+<path fill="none" stroke="black" d="M32,-200.82C32,-193.2 32,-184 32,-175.32"/>
+<polygon fill="black" stroke="black" points="35.5,-175.12 32,-165.12 28.5,-175.12 35.5,-175.12"/>
+</g>
+<!-- array&#45;003 -->
+<g id="node4" class="node">
+<title>array&#45;003</title>
+<g id="a_node4"><a xlink:title="name: array&#45;003&#10;variable: c&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float32&#10;chunk memory: 16 bytes&#10;nbytes: 36 bytes">
+<polygon fill="#ffd8b1" stroke="black" points="61.5,-88 2.5,-88 2.5,-52 61.5,-52 61.5,-88"/>
+<text text-anchor="middle" x="32" y="-73" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;003</text>
+<text text-anchor="middle" x="32" y="-62" font-family="Helvetica,sans-Serif" font-size="10.00">c</text>
+</a>
+</g>
+</g>
+<!-- op&#45;003&#45;&gt;array&#45;003 -->
+<g id="edge3" class="edge">
+<title>op&#45;003&#45;&gt;array&#45;003</title>
+<path fill="none" stroke="black" d="M32,-123.69C32,-115.91 32,-106.84 32,-98.45"/>
+<polygon fill="black" stroke="black" points="35.5,-98.32 32,-88.32 28.5,-98.32 35.5,-98.32"/>
+</g>
+<!-- create&#45;arrays -->
+<g id="node5" class="node">
+<title>create&#45;arrays</title>
+<g id="a_node5"><a xlink:title="name: create&#45;arrays&#10;op: create&#45;arrays&#10;projected memory: 100.0 MB&#10;tasks: 1">
+<path fill="none" stroke="black" d="M140.5,-309C140.5,-309 89.5,-309 89.5,-309 83.5,-309 77.5,-303 77.5,-297 77.5,-297 77.5,-285 77.5,-285 77.5,-279 83.5,-273 89.5,-273 89.5,-273 140.5,-273 140.5,-273 146.5,-273 152.5,-279 152.5,-285 152.5,-285 152.5,-297 152.5,-297 152.5,-303 146.5,-309 140.5,-309"/>
+<text text-anchor="middle" x="115" y="-294" font-family="Helvetica,sans-Serif" font-size="10.00">create&#45;arrays</text>
+<text text-anchor="middle" x="115" y="-283" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 1</text>
+</a>
+</g>
+</g>
+<!-- arrays -->
+<g id="node6" class="node">
+<title>arrays</title>
+<g id="a_node6"><a xlink:title="name: arrays">
+<polygon fill="none" stroke="black" points="142,-237 88,-237 88,-201 142,-201 142,-237"/>
+<text text-anchor="middle" x="115" y="-216.5" font-family="Helvetica,sans-Serif" font-size="10.00">arrays</text>
+</a>
+</g>
+</g>
+<!-- create&#45;arrays&#45;&gt;arrays -->
+<g id="edge4" class="edge">
+<title>create&#45;arrays&#45;&gt;arrays</title>
+<path fill="none" stroke="black" d="M115,-272.7C115,-264.98 115,-255.71 115,-247.11"/>
+<polygon fill="black" stroke="black" points="118.5,-247.1 115,-237.1 111.5,-247.1 118.5,-247.1"/>
+</g>
+</g>
+</svg>
diff --git a/docs/images/optimization_multiple_inputs.svg b/docs/images/optimization_multiple_inputs.svg
new file mode 100644
index 00000000..b0da3e21
--- /dev/null
+++ b/docs/images/optimization_multiple_inputs.svg
@@ -0,0 +1,164 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN"
+ "http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
+<!-- Generated by graphviz version 10.0.1 (20240210.2158)
+ -->
+<!-- Pages: 1 -->
+<svg width="305pt" height="319pt"
+ viewBox="0.00 0.00 304.75 318.75" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink">
+<g id="graph0" class="graph" transform="scale(1 1) rotate(0) translate(4 314.75)">
+<polygon fill="white" stroke="none" points="-4,4 -4,-314.75 300.75,-314.75 300.75,4 -4,4"/>
+<text text-anchor="start" x="8" y="-39.5" font-family="Times,serif" font-size="10.00">num tasks: 5</text>
+<text text-anchor="start" x="8" y="-28.25" font-family="Times,serif" font-size="10.00">max projected memory: 100.0 MB</text>
+<text text-anchor="start" x="8" y="-17" font-family="Times,serif" font-size="10.00">total nbytes written: 72 bytes</text>
+<text text-anchor="start" x="8" y="-5.75" font-family="Times,serif" font-size="10.00">optimized: True</text>
+<!-- op&#45;004 -->
+<g id="node1" class="node">
+<title>op&#45;004</title>
+<g id="a_node1"><a xlink:title="name: op&#45;004&#10;op: full&#10;calls: &lt;module&gt; &#45;&gt; ones &#45;&gt; full&#10;line: 1 in &lt;module&gt;">
+<path fill="none" stroke="black" d="M43.25,-310.75C43.25,-310.75 13.25,-310.75 13.25,-310.75 7.25,-310.75 1.25,-304.75 1.25,-298.75 1.25,-298.75 1.25,-286.75 1.25,-286.75 1.25,-280.75 7.25,-274.75 13.25,-274.75 13.25,-274.75 43.25,-274.75 43.25,-274.75 49.25,-274.75 55.25,-280.75 55.25,-286.75 55.25,-286.75 55.25,-298.75 55.25,-298.75 55.25,-304.75 49.25,-310.75 43.25,-310.75"/>
+<text text-anchor="middle" x="28.25" y="-294.5" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;004</text>
+<text text-anchor="middle" x="28.25" y="-283.25" font-family="Helvetica,sans-Serif" font-size="10.00">ones</text>
+</a>
+</g>
+</g>
+<!-- array&#45;004 -->
+<g id="node2" class="node">
+<title>array&#45;004</title>
+<g id="a_node2"><a xlink:title="name: array&#45;004&#10;variable: a&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float64&#10;chunk memory: 8 bytes">
+<polygon fill="none" stroke="black" points="56.5,-238.75 0,-238.75 0,-202.75 56.5,-202.75 56.5,-238.75"/>
+<text text-anchor="middle" x="28.25" y="-222.5" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;004</text>
+<text text-anchor="middle" x="28.25" y="-211.25" font-family="Helvetica,sans-Serif" font-size="10.00">a</text>
+</a>
+</g>
+</g>
+<!-- op&#45;004&#45;&gt;array&#45;004 -->
+<g id="edge1" class="edge">
+<title>op&#45;004&#45;&gt;array&#45;004</title>
+<path fill="none" stroke="black" d="M28.25,-274.45C28.25,-267.16 28.25,-258.48 28.25,-250.29"/>
+<polygon fill="black" stroke="black" points="31.75,-250.37 28.25,-240.37 24.75,-250.37 31.75,-250.37"/>
+</g>
+<!-- op&#45;008 -->
+<g id="node7" class="node">
+<title>op&#45;008</title>
+<g id="a_node7"><a xlink:title="name: op&#45;008&#10;op: blockwise&#10;projected memory: 100.0 MB&#10;tasks: 4&#10;num input blocks: (1, 1, 1)&#10;calls: &lt;module&gt; &#45;&gt; add &#45;&gt; elemwise &#45;&gt; blockwise&#10;line: 1 in &lt;module&gt;">
+<path fill="#dcbeff" stroke="black" d="M118.25,-166.75C118.25,-166.75 88.25,-166.75 88.25,-166.75 82.25,-166.75 76.25,-160.75 76.25,-154.75 76.25,-154.75 76.25,-137 76.25,-137 76.25,-131 82.25,-125 88.25,-125 88.25,-125 118.25,-125 118.25,-125 124.25,-125 130.25,-131 130.25,-137 130.25,-137 130.25,-154.75 130.25,-154.75 130.25,-160.75 124.25,-166.75 118.25,-166.75"/>
+<text text-anchor="middle" x="103.25" y="-153.25" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;008</text>
+<text text-anchor="middle" x="103.25" y="-142" font-family="Helvetica,sans-Serif" font-size="10.00">add</text>
+<text text-anchor="middle" x="103.25" y="-130.75" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 4</text>
+</a>
+</g>
+</g>
+<!-- array&#45;004&#45;&gt;op&#45;008 -->
+<g id="edge2" class="edge">
+<title>array&#45;004&#45;&gt;op&#45;008</title>
+<path fill="none" stroke="black" d="M46.02,-202.48C54.47,-194.28 64.77,-184.26 74.3,-175"/>
+<polygon fill="black" stroke="black" points="76.59,-177.66 81.33,-168.18 71.71,-172.64 76.59,-177.66"/>
+</g>
+<!-- op&#45;005 -->
+<g id="node3" class="node">
+<title>op&#45;005</title>
+<g id="a_node3"><a xlink:title="name: op&#45;005&#10;op: full&#10;calls: &lt;module&gt; &#45;&gt; ones &#45;&gt; full&#10;line: 1 in &lt;module&gt;">
+<path fill="none" stroke="black" d="M118.25,-310.75C118.25,-310.75 88.25,-310.75 88.25,-310.75 82.25,-310.75 76.25,-304.75 76.25,-298.75 76.25,-298.75 76.25,-286.75 76.25,-286.75 76.25,-280.75 82.25,-274.75 88.25,-274.75 88.25,-274.75 118.25,-274.75 118.25,-274.75 124.25,-274.75 130.25,-280.75 130.25,-286.75 130.25,-286.75 130.25,-298.75 130.25,-298.75 130.25,-304.75 124.25,-310.75 118.25,-310.75"/>
+<text text-anchor="middle" x="103.25" y="-294.5" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;005</text>
+<text text-anchor="middle" x="103.25" y="-283.25" font-family="Helvetica,sans-Serif" font-size="10.00">ones</text>
+</a>
+</g>
+</g>
+<!-- array&#45;005 -->
+<g id="node4" class="node">
+<title>array&#45;005</title>
+<g id="a_node4"><a xlink:title="name: array&#45;005&#10;variable: b&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float64&#10;chunk memory: 8 bytes">
+<polygon fill="none" stroke="black" points="131.5,-238.75 75,-238.75 75,-202.75 131.5,-202.75 131.5,-238.75"/>
+<text text-anchor="middle" x="103.25" y="-222.5" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;005</text>
+<text text-anchor="middle" x="103.25" y="-211.25" font-family="Helvetica,sans-Serif" font-size="10.00">b</text>
+</a>
+</g>
+</g>
+<!-- op&#45;005&#45;&gt;array&#45;005 -->
+<g id="edge3" class="edge">
+<title>op&#45;005&#45;&gt;array&#45;005</title>
+<path fill="none" stroke="black" d="M103.25,-274.45C103.25,-267.16 103.25,-258.48 103.25,-250.29"/>
+<polygon fill="black" stroke="black" points="106.75,-250.37 103.25,-240.37 99.75,-250.37 106.75,-250.37"/>
+</g>
+<!-- array&#45;005&#45;&gt;op&#45;008 -->
+<g id="edge4" class="edge">
+<title>array&#45;005&#45;&gt;op&#45;008</title>
+<path fill="none" stroke="black" d="M103.25,-202.48C103.25,-195.27 103.25,-186.66 103.25,-178.4"/>
+<polygon fill="black" stroke="black" points="106.75,-178.64 103.25,-168.64 99.75,-178.64 106.75,-178.64"/>
+</g>
+<!-- op&#45;006 -->
+<g id="node5" class="node">
+<title>op&#45;006</title>
+<g id="a_node5"><a xlink:title="name: op&#45;006&#10;op: full&#10;calls: &lt;module&gt; &#45;&gt; ones &#45;&gt; full&#10;line: 1 in &lt;module&gt;">
+<path fill="none" stroke="black" d="M193.25,-310.75C193.25,-310.75 163.25,-310.75 163.25,-310.75 157.25,-310.75 151.25,-304.75 151.25,-298.75 151.25,-298.75 151.25,-286.75 151.25,-286.75 151.25,-280.75 157.25,-274.75 163.25,-274.75 163.25,-274.75 193.25,-274.75 193.25,-274.75 199.25,-274.75 205.25,-280.75 205.25,-286.75 205.25,-286.75 205.25,-298.75 205.25,-298.75 205.25,-304.75 199.25,-310.75 193.25,-310.75"/>
+<text text-anchor="middle" x="178.25" y="-294.5" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;006</text>
+<text text-anchor="middle" x="178.25" y="-283.25" font-family="Helvetica,sans-Serif" font-size="10.00">ones</text>
+</a>
+</g>
+</g>
+<!-- array&#45;006 -->
+<g id="node6" class="node">
+<title>array&#45;006</title>
+<g id="a_node6"><a xlink:title="name: array&#45;006&#10;variable: c&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float64&#10;chunk memory: 8 bytes">
+<polygon fill="none" stroke="black" points="206.5,-238.75 150,-238.75 150,-202.75 206.5,-202.75 206.5,-238.75"/>
+<text text-anchor="middle" x="178.25" y="-222.5" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;006</text>
+<text text-anchor="middle" x="178.25" y="-211.25" font-family="Helvetica,sans-Serif" font-size="10.00">c</text>
+</a>
+</g>
+</g>
+<!-- op&#45;006&#45;&gt;array&#45;006 -->
+<g id="edge5" class="edge">
+<title>op&#45;006&#45;&gt;array&#45;006</title>
+<path fill="none" stroke="black" d="M178.25,-274.45C178.25,-267.16 178.25,-258.48 178.25,-250.29"/>
+<polygon fill="black" stroke="black" points="181.75,-250.37 178.25,-240.37 174.75,-250.37 181.75,-250.37"/>
+</g>
+<!-- array&#45;006&#45;&gt;op&#45;008 -->
+<g id="edge6" class="edge">
+<title>array&#45;006&#45;&gt;op&#45;008</title>
+<path fill="none" stroke="black" d="M160.48,-202.48C152.03,-194.28 141.73,-184.26 132.2,-175"/>
+<polygon fill="black" stroke="black" points="134.79,-172.64 125.17,-168.18 129.91,-177.66 134.79,-172.64"/>
+</g>
+<!-- array&#45;008 -->
+<g id="node8" class="node">
+<title>array&#45;008</title>
+<g id="a_node8"><a xlink:title="name: array&#45;008&#10;variable: e&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float64&#10;chunk memory: 32 bytes&#10;nbytes: 72 bytes">
+<polygon fill="#ffd8b1" stroke="black" points="131.5,-89 75,-89 75,-53 131.5,-53 131.5,-89"/>
+<text text-anchor="middle" x="103.25" y="-72.75" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;008</text>
+<text text-anchor="middle" x="103.25" y="-61.5" font-family="Helvetica,sans-Serif" font-size="10.00">e</text>
+</a>
+</g>
+</g>
+<!-- op&#45;008&#45;&gt;array&#45;008 -->
+<g id="edge7" class="edge">
+<title>op&#45;008&#45;&gt;array&#45;008</title>
+<path fill="none" stroke="black" d="M103.25,-124.58C103.25,-117.19 103.25,-108.7 103.25,-100.73"/>
+<polygon fill="black" stroke="black" points="106.75,-100.74 103.25,-90.74 99.75,-100.74 106.75,-100.74"/>
+</g>
+<!-- create&#45;arrays -->
+<g id="node9" class="node">
+<title>create&#45;arrays</title>
+<g id="a_node9"><a xlink:title="name: create&#45;arrays&#10;op: create&#45;arrays&#10;projected memory: 100.0 MB&#10;tasks: 1">
+<path fill="none" stroke="black" d="M284.75,-310.75C284.75,-310.75 235.75,-310.75 235.75,-310.75 229.75,-310.75 223.75,-304.75 223.75,-298.75 223.75,-298.75 223.75,-286.75 223.75,-286.75 223.75,-280.75 229.75,-274.75 235.75,-274.75 235.75,-274.75 284.75,-274.75 284.75,-274.75 290.75,-274.75 296.75,-280.75 296.75,-286.75 296.75,-286.75 296.75,-298.75 296.75,-298.75 296.75,-304.75 290.75,-310.75 284.75,-310.75"/>
+<text text-anchor="middle" x="260.25" y="-294.5" font-family="Helvetica,sans-Serif" font-size="10.00">create&#45;arrays</text>
+<text text-anchor="middle" x="260.25" y="-283.25" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 1</text>
+</a>
+</g>
+</g>
+<!-- arrays -->
+<g id="node10" class="node">
+<title>arrays</title>
+<g id="a_node10"><a xlink:title="name: arrays">
+<polygon fill="none" stroke="black" points="287.25,-238.75 233.25,-238.75 233.25,-202.75 287.25,-202.75 287.25,-238.75"/>
+<text text-anchor="middle" x="260.25" y="-216.88" font-family="Helvetica,sans-Serif" font-size="10.00">arrays</text>
+</a>
+</g>
+</g>
+<!-- create&#45;arrays&#45;&gt;arrays -->
+<g id="edge8" class="edge">
+<title>create&#45;arrays&#45;&gt;arrays</title>
+<path fill="none" stroke="black" d="M260.25,-274.45C260.25,-267.16 260.25,-258.48 260.25,-250.29"/>
+<polygon fill="black" stroke="black" points="263.75,-250.37 260.25,-240.37 256.75,-250.37 263.75,-250.37"/>
+</g>
+</g>
+</svg>
diff --git a/docs/images/optimization_multiple_inputs_unoptimized.svg b/docs/images/optimization_multiple_inputs_unoptimized.svg
new file mode 100644
index 00000000..7eb2026e
--- /dev/null
+++ b/docs/images/optimization_multiple_inputs_unoptimized.svg
@@ -0,0 +1,197 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN"
+ "http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
+<!-- Generated by graphviz version 10.0.1 (20240210.2158)
+ -->
+<!-- Pages: 1 -->
+<svg width="268pt" height="469pt"
+ viewBox="0.00 0.00 267.75 468.50" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink">
+<g id="graph0" class="graph" transform="scale(1 1) rotate(0) translate(4 464.5)">
+<polygon fill="white" stroke="none" points="-4,4 -4,-464.5 263.75,-464.5 263.75,4 -4,4"/>
+<text text-anchor="start" x="8" y="-39.5" font-family="Times,serif" font-size="10.00">num tasks: 10</text>
+<text text-anchor="start" x="8" y="-28.25" font-family="Times,serif" font-size="10.00">max projected memory: 100.0 MB</text>
+<text text-anchor="start" x="8" y="-17" font-family="Times,serif" font-size="10.00">total nbytes written: 144 bytes</text>
+<text text-anchor="start" x="8" y="-5.75" font-family="Times,serif" font-size="10.00">optimized: False</text>
+<!-- op&#45;004 -->
+<g id="node1" class="node">
+<title>op&#45;004</title>
+<g id="a_node1"><a xlink:title="name: op&#45;004&#10;op: full&#10;calls: &lt;module&gt; &#45;&gt; ones &#45;&gt; full&#10;line: 1 in &lt;module&gt;">
+<path fill="none" stroke="black" d="M43.25,-313.62C43.25,-313.62 13.25,-313.62 13.25,-313.62 7.25,-313.62 1.25,-307.62 1.25,-301.62 1.25,-301.62 1.25,-289.62 1.25,-289.62 1.25,-283.62 7.25,-277.62 13.25,-277.62 13.25,-277.62 43.25,-277.62 43.25,-277.62 49.25,-277.62 55.25,-283.62 55.25,-289.62 55.25,-289.62 55.25,-301.62 55.25,-301.62 55.25,-307.62 49.25,-313.62 43.25,-313.62"/>
+<text text-anchor="middle" x="28.25" y="-297.38" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;004</text>
+<text text-anchor="middle" x="28.25" y="-286.12" font-family="Helvetica,sans-Serif" font-size="10.00">ones</text>
+</a>
+</g>
+</g>
+<!-- array&#45;004 -->
+<g id="node2" class="node">
+<title>array&#45;004</title>
+<g id="a_node2"><a xlink:title="name: array&#45;004&#10;variable: a&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float64&#10;chunk memory: 8 bytes">
+<polygon fill="none" stroke="black" points="56.5,-238.75 0,-238.75 0,-202.75 56.5,-202.75 56.5,-238.75"/>
+<text text-anchor="middle" x="28.25" y="-222.5" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;004</text>
+<text text-anchor="middle" x="28.25" y="-211.25" font-family="Helvetica,sans-Serif" font-size="10.00">a</text>
+</a>
+</g>
+</g>
+<!-- op&#45;004&#45;&gt;array&#45;004 -->
+<g id="edge1" class="edge">
+<title>op&#45;004&#45;&gt;array&#45;004</title>
+<path fill="none" stroke="black" d="M28.25,-277.35C28.25,-269.34 28.25,-259.59 28.25,-250.5"/>
+<polygon fill="black" stroke="black" points="31.75,-250.66 28.25,-240.66 24.75,-250.66 31.75,-250.66"/>
+</g>
+<!-- op&#45;008 -->
+<g id="node9" class="node">
+<title>op&#45;008</title>
+<g id="a_node9"><a xlink:title="name: op&#45;008&#10;op: blockwise&#10;projected memory: 100.0 MB&#10;tasks: 4&#10;num input blocks: (1, 1)&#10;calls: &lt;module&gt; &#45;&gt; add &#45;&gt; elemwise &#45;&gt; blockwise&#10;line: 1 in &lt;module&gt;">
+<path fill="#dcbeff" stroke="black" d="M80.25,-166.75C80.25,-166.75 50.25,-166.75 50.25,-166.75 44.25,-166.75 38.25,-160.75 38.25,-154.75 38.25,-154.75 38.25,-137 38.25,-137 38.25,-131 44.25,-125 50.25,-125 50.25,-125 80.25,-125 80.25,-125 86.25,-125 92.25,-131 92.25,-137 92.25,-137 92.25,-154.75 92.25,-154.75 92.25,-160.75 86.25,-166.75 80.25,-166.75"/>
+<text text-anchor="middle" x="65.25" y="-153.25" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;008</text>
+<text text-anchor="middle" x="65.25" y="-142" font-family="Helvetica,sans-Serif" font-size="10.00">add</text>
+<text text-anchor="middle" x="65.25" y="-130.75" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 4</text>
+</a>
+</g>
+</g>
+<!-- array&#45;004&#45;&gt;op&#45;008 -->
+<g id="edge2" class="edge">
+<title>array&#45;004&#45;&gt;op&#45;008</title>
+<path fill="none" stroke="black" d="M37.02,-202.48C40.85,-194.94 45.45,-185.87 49.82,-177.26"/>
+<polygon fill="black" stroke="black" points="52.88,-178.97 54.28,-168.47 46.64,-175.8 52.88,-178.97"/>
+</g>
+<!-- op&#45;005 -->
+<g id="node3" class="node">
+<title>op&#45;005</title>
+<g id="a_node3"><a xlink:title="name: op&#45;005&#10;op: full&#10;calls: &lt;module&gt; &#45;&gt; ones &#45;&gt; full&#10;line: 1 in &lt;module&gt;">
+<path fill="none" stroke="black" d="M81.25,-460.5C81.25,-460.5 51.25,-460.5 51.25,-460.5 45.25,-460.5 39.25,-454.5 39.25,-448.5 39.25,-448.5 39.25,-436.5 39.25,-436.5 39.25,-430.5 45.25,-424.5 51.25,-424.5 51.25,-424.5 81.25,-424.5 81.25,-424.5 87.25,-424.5 93.25,-430.5 93.25,-436.5 93.25,-436.5 93.25,-448.5 93.25,-448.5 93.25,-454.5 87.25,-460.5 81.25,-460.5"/>
+<text text-anchor="middle" x="66.25" y="-444.25" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;005</text>
+<text text-anchor="middle" x="66.25" y="-433" font-family="Helvetica,sans-Serif" font-size="10.00">ones</text>
+</a>
+</g>
+</g>
+<!-- array&#45;005 -->
+<g id="node4" class="node">
+<title>array&#45;005</title>
+<g id="a_node4"><a xlink:title="name: array&#45;005&#10;variable: b&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float64&#10;chunk memory: 8 bytes">
+<polygon fill="none" stroke="black" points="94.5,-388.5 38,-388.5 38,-352.5 94.5,-352.5 94.5,-388.5"/>
+<text text-anchor="middle" x="66.25" y="-372.25" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;005</text>
+<text text-anchor="middle" x="66.25" y="-361" font-family="Helvetica,sans-Serif" font-size="10.00">b</text>
+</a>
+</g>
+</g>
+<!-- op&#45;005&#45;&gt;array&#45;005 -->
+<g id="edge3" class="edge">
+<title>op&#45;005&#45;&gt;array&#45;005</title>
+<path fill="none" stroke="black" d="M66.25,-424.2C66.25,-416.91 66.25,-408.23 66.25,-400.04"/>
+<polygon fill="black" stroke="black" points="69.75,-400.12 66.25,-390.12 62.75,-400.12 69.75,-400.12"/>
+</g>
+<!-- op&#45;007 -->
+<g id="node7" class="node">
+<title>op&#45;007</title>
+<g id="a_node7"><a xlink:title="name: op&#45;007&#10;op: blockwise&#10;projected memory: 100.0 MB&#10;tasks: 4&#10;num input blocks: (1, 1)&#10;calls: &lt;module&gt; &#45;&gt; add &#45;&gt; elemwise &#45;&gt; blockwise&#10;line: 1 in &lt;module&gt;">
+<path fill="#dcbeff" stroke="black" d="M118.25,-316.5C118.25,-316.5 88.25,-316.5 88.25,-316.5 82.25,-316.5 76.25,-310.5 76.25,-304.5 76.25,-304.5 76.25,-286.75 76.25,-286.75 76.25,-280.75 82.25,-274.75 88.25,-274.75 88.25,-274.75 118.25,-274.75 118.25,-274.75 124.25,-274.75 130.25,-280.75 130.25,-286.75 130.25,-286.75 130.25,-304.5 130.25,-304.5 130.25,-310.5 124.25,-316.5 118.25,-316.5"/>
+<text text-anchor="middle" x="103.25" y="-303" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;007</text>
+<text text-anchor="middle" x="103.25" y="-291.75" font-family="Helvetica,sans-Serif" font-size="10.00">add</text>
+<text text-anchor="middle" x="103.25" y="-280.5" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 4</text>
+</a>
+</g>
+</g>
+<!-- array&#45;005&#45;&gt;op&#45;007 -->
+<g id="edge4" class="edge">
+<title>array&#45;005&#45;&gt;op&#45;007</title>
+<path fill="none" stroke="black" d="M75.02,-352.23C78.85,-344.69 83.45,-335.62 87.82,-327.01"/>
+<polygon fill="black" stroke="black" points="90.88,-328.72 92.28,-318.22 84.64,-325.55 90.88,-328.72"/>
+</g>
+<!-- op&#45;006 -->
+<g id="node5" class="node">
+<title>op&#45;006</title>
+<g id="a_node5"><a xlink:title="name: op&#45;006&#10;op: full&#10;calls: &lt;module&gt; &#45;&gt; ones &#45;&gt; full&#10;line: 1 in &lt;module&gt;">
+<path fill="none" stroke="black" d="M156.25,-460.5C156.25,-460.5 126.25,-460.5 126.25,-460.5 120.25,-460.5 114.25,-454.5 114.25,-448.5 114.25,-448.5 114.25,-436.5 114.25,-436.5 114.25,-430.5 120.25,-424.5 126.25,-424.5 126.25,-424.5 156.25,-424.5 156.25,-424.5 162.25,-424.5 168.25,-430.5 168.25,-436.5 168.25,-436.5 168.25,-448.5 168.25,-448.5 168.25,-454.5 162.25,-460.5 156.25,-460.5"/>
+<text text-anchor="middle" x="141.25" y="-444.25" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;006</text>
+<text text-anchor="middle" x="141.25" y="-433" font-family="Helvetica,sans-Serif" font-size="10.00">ones</text>
+</a>
+</g>
+</g>
+<!-- array&#45;006 -->
+<g id="node6" class="node">
+<title>array&#45;006</title>
+<g id="a_node6"><a xlink:title="name: array&#45;006&#10;variable: c&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float64&#10;chunk memory: 8 bytes">
+<polygon fill="none" stroke="black" points="169.5,-388.5 113,-388.5 113,-352.5 169.5,-352.5 169.5,-388.5"/>
+<text text-anchor="middle" x="141.25" y="-372.25" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;006</text>
+<text text-anchor="middle" x="141.25" y="-361" font-family="Helvetica,sans-Serif" font-size="10.00">c</text>
+</a>
+</g>
+</g>
+<!-- op&#45;006&#45;&gt;array&#45;006 -->
+<g id="edge5" class="edge">
+<title>op&#45;006&#45;&gt;array&#45;006</title>
+<path fill="none" stroke="black" d="M141.25,-424.2C141.25,-416.91 141.25,-408.23 141.25,-400.04"/>
+<polygon fill="black" stroke="black" points="144.75,-400.12 141.25,-390.12 137.75,-400.12 144.75,-400.12"/>
+</g>
+<!-- array&#45;006&#45;&gt;op&#45;007 -->
+<g id="edge6" class="edge">
+<title>array&#45;006&#45;&gt;op&#45;007</title>
+<path fill="none" stroke="black" d="M132.24,-352.23C128.31,-344.69 123.58,-335.62 119.09,-327.01"/>
+<polygon fill="black" stroke="black" points="122.24,-325.46 114.51,-318.22 116.03,-328.7 122.24,-325.46"/>
+</g>
+<!-- array&#45;007 -->
+<g id="node8" class="node">
+<title>array&#45;007</title>
+<g id="a_node8"><a xlink:title="name: array&#45;007&#10;variable: d&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float64&#10;chunk memory: 32 bytes&#10;nbytes: 72 bytes">
+<polygon fill="#ffd8b1" stroke="black" points="131.5,-238.75 75,-238.75 75,-202.75 131.5,-202.75 131.5,-238.75"/>
+<text text-anchor="middle" x="103.25" y="-222.5" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;007</text>
+<text text-anchor="middle" x="103.25" y="-211.25" font-family="Helvetica,sans-Serif" font-size="10.00">d</text>
+</a>
+</g>
+</g>
+<!-- op&#45;007&#45;&gt;array&#45;007 -->
+<g id="edge7" class="edge">
+<title>op&#45;007&#45;&gt;array&#45;007</title>
+<path fill="none" stroke="black" d="M103.25,-274.33C103.25,-266.94 103.25,-258.45 103.25,-250.48"/>
+<polygon fill="black" stroke="black" points="106.75,-250.49 103.25,-240.49 99.75,-250.49 106.75,-250.49"/>
+</g>
+<!-- array&#45;007&#45;&gt;op&#45;008 -->
+<g id="edge8" class="edge">
+<title>array&#45;007&#45;&gt;op&#45;008</title>
+<path fill="none" stroke="black" d="M94.24,-202.48C90.31,-194.94 85.58,-185.87 81.09,-177.26"/>
+<polygon fill="black" stroke="black" points="84.24,-175.71 76.51,-168.47 78.03,-178.95 84.24,-175.71"/>
+</g>
+<!-- array&#45;008 -->
+<g id="node10" class="node">
+<title>array&#45;008</title>
+<g id="a_node10"><a xlink:title="name: array&#45;008&#10;variable: e&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float64&#10;chunk memory: 32 bytes&#10;nbytes: 72 bytes">
+<polygon fill="#ffd8b1" stroke="black" points="93.5,-89 37,-89 37,-53 93.5,-53 93.5,-89"/>
+<text text-anchor="middle" x="65.25" y="-72.75" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;008</text>
+<text text-anchor="middle" x="65.25" y="-61.5" font-family="Helvetica,sans-Serif" font-size="10.00">e</text>
+</a>
+</g>
+</g>
+<!-- op&#45;008&#45;&gt;array&#45;008 -->
+<g id="edge9" class="edge">
+<title>op&#45;008&#45;&gt;array&#45;008</title>
+<path fill="none" stroke="black" d="M65.25,-124.58C65.25,-117.19 65.25,-108.7 65.25,-100.73"/>
+<polygon fill="black" stroke="black" points="68.75,-100.74 65.25,-90.74 61.75,-100.74 68.75,-100.74"/>
+</g>
+<!-- create&#45;arrays -->
+<g id="node11" class="node">
+<title>create&#45;arrays</title>
+<g id="a_node11"><a xlink:title="name: create&#45;arrays&#10;op: create&#45;arrays&#10;projected memory: 100.0 MB&#10;tasks: 2">
+<path fill="none" stroke="black" d="M247.75,-460.5C247.75,-460.5 198.75,-460.5 198.75,-460.5 192.75,-460.5 186.75,-454.5 186.75,-448.5 186.75,-448.5 186.75,-436.5 186.75,-436.5 186.75,-430.5 192.75,-424.5 198.75,-424.5 198.75,-424.5 247.75,-424.5 247.75,-424.5 253.75,-424.5 259.75,-430.5 259.75,-436.5 259.75,-436.5 259.75,-448.5 259.75,-448.5 259.75,-454.5 253.75,-460.5 247.75,-460.5"/>
+<text text-anchor="middle" x="223.25" y="-444.25" font-family="Helvetica,sans-Serif" font-size="10.00">create&#45;arrays</text>
+<text text-anchor="middle" x="223.25" y="-433" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 2</text>
+</a>
+</g>
+</g>
+<!-- arrays -->
+<g id="node12" class="node">
+<title>arrays</title>
+<g id="a_node12"><a xlink:title="name: arrays">
+<polygon fill="none" stroke="black" points="250.25,-388.5 196.25,-388.5 196.25,-352.5 250.25,-352.5 250.25,-388.5"/>
+<text text-anchor="middle" x="223.25" y="-366.62" font-family="Helvetica,sans-Serif" font-size="10.00">arrays</text>
+</a>
+</g>
+</g>
+<!-- create&#45;arrays&#45;&gt;arrays -->
+<g id="edge10" class="edge">
+<title>create&#45;arrays&#45;&gt;arrays</title>
+<path fill="none" stroke="black" d="M223.25,-424.2C223.25,-416.91 223.25,-408.23 223.25,-400.04"/>
+<polygon fill="black" stroke="black" points="226.75,-400.12 223.25,-390.12 219.75,-400.12 226.75,-400.12"/>
+</g>
+</g>
+</svg>
diff --git a/docs/images/optimization_turned_off.svg b/docs/images/optimization_turned_off.svg
new file mode 100644
index 00000000..3f83dae6
--- /dev/null
+++ b/docs/images/optimization_turned_off.svg
@@ -0,0 +1,133 @@
+<?xml version="1.0" encoding="UTF-8" standalone="no"?>
+<!DOCTYPE svg PUBLIC "-//W3C//DTD SVG 1.1//EN"
+ "http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd">
+<!-- Generated by graphviz version 2.49.3 (20211023.0002)
+ -->
+<!-- Pages: 1 -->
+<svg width="163pt" height="466pt"
+ viewBox="0.00 0.00 163.00 466.00" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink">
+<g id="graph0" class="graph" transform="scale(1 1) rotate(0) translate(4 462)">
+<polygon fill="white" stroke="transparent" points="-4,4 -4,-462 159,-462 159,4 -4,4"/>
+<text text-anchor="start" x="8" y="-40" font-family="Times,serif" font-size="10.00">num tasks: 10</text>
+<text text-anchor="start" x="8" y="-29" font-family="Times,serif" font-size="10.00">max projected memory: 100.0 MB</text>
+<text text-anchor="start" x="8" y="-18" font-family="Times,serif" font-size="10.00">total nbytes: 108 bytes</text>
+<text text-anchor="start" x="8" y="-7" font-family="Times,serif" font-size="10.00">optimized: False</text>
+<!-- op&#45;001 -->
+<g id="node1" class="node">
+<title>op&#45;001</title>
+<g id="a_node1"><a xlink:title="name: op&#45;001&#10;op: asarray&#10;calls: &lt;module&gt; &#45;&gt; asarray&#10;line: 1 in &lt;module&gt;">
+<path fill="none" stroke="black" d="M47,-458C47,-458 17,-458 17,-458 11,-458 5,-452 5,-446 5,-446 5,-434 5,-434 5,-428 11,-422 17,-422 17,-422 47,-422 47,-422 53,-422 59,-428 59,-434 59,-434 59,-446 59,-446 59,-452 53,-458 47,-458"/>
+<text text-anchor="middle" x="32" y="-443" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;001</text>
+<text text-anchor="middle" x="32" y="-432" font-family="Helvetica,sans-Serif" font-size="10.00">asarray</text>
+</a>
+</g>
+</g>
+<!-- array&#45;001 -->
+<g id="node2" class="node">
+<title>array&#45;001</title>
+<g id="a_node2"><a xlink:title="name: array&#45;001&#10;variable: a&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: int64&#10;chunk memory: 32 bytes">
+<polygon fill="none" stroke="black" points="61.5,-386 2.5,-386 2.5,-350 61.5,-350 61.5,-386"/>
+<text text-anchor="middle" x="32" y="-371" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;001</text>
+<text text-anchor="middle" x="32" y="-360" font-family="Helvetica,sans-Serif" font-size="10.00">a</text>
+</a>
+</g>
+</g>
+<!-- op&#45;001&#45;&gt;array&#45;001 -->
+<g id="edge1" class="edge">
+<title>op&#45;001&#45;&gt;array&#45;001</title>
+<path fill="none" stroke="black" d="M32,-421.7C32,-413.98 32,-404.71 32,-396.11"/>
+<polygon fill="black" stroke="black" points="35.5,-396.1 32,-386.1 28.5,-396.1 35.5,-396.1"/>
+</g>
+<!-- op&#45;002 -->
+<g id="node3" class="node">
+<title>op&#45;002</title>
+<g id="a_node3"><a xlink:title="name: op&#45;002&#10;op: blockwise&#10;projected memory: 100.0 MB&#10;tasks: 4&#10;num input blocks: (1,)&#10;calls: &lt;module&gt; &#45;&gt; negative &#45;&gt; elemwise &#45;&gt; blockwise&#10;line: 1 in &lt;module&gt;">
+<path fill="#dcbeff" stroke="black" d="M47,-314C47,-314 17,-314 17,-314 11,-314 5,-308 5,-302 5,-302 5,-285 5,-285 5,-279 11,-273 17,-273 17,-273 47,-273 47,-273 53,-273 59,-279 59,-285 59,-285 59,-302 59,-302 59,-308 53,-314 47,-314"/>
+<text text-anchor="middle" x="32" y="-302" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;002</text>
+<text text-anchor="middle" x="32" y="-291" font-family="Helvetica,sans-Serif" font-size="10.00">negative</text>
+<text text-anchor="middle" x="32" y="-280" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 4</text>
+</a>
+</g>
+</g>
+<!-- array&#45;001&#45;&gt;op&#45;002 -->
+<g id="edge2" class="edge">
+<title>array&#45;001&#45;&gt;op&#45;002</title>
+<path fill="none" stroke="black" d="M32,-349.82C32,-342.2 32,-333 32,-324.32"/>
+<polygon fill="black" stroke="black" points="35.5,-324.12 32,-314.12 28.5,-324.12 35.5,-324.12"/>
+</g>
+<!-- array&#45;002 -->
+<g id="node4" class="node">
+<title>array&#45;002</title>
+<g id="a_node4"><a xlink:title="name: array&#45;002&#10;variable: b&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: int64&#10;chunk memory: 32 bytes&#10;nbytes: 72 bytes">
+<polygon fill="#ffd8b1" stroke="black" points="61.5,-237 2.5,-237 2.5,-201 61.5,-201 61.5,-237"/>
+<text text-anchor="middle" x="32" y="-222" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;002</text>
+<text text-anchor="middle" x="32" y="-211" font-family="Helvetica,sans-Serif" font-size="10.00">b</text>
+</a>
+</g>
+</g>
+<!-- op&#45;002&#45;&gt;array&#45;002 -->
+<g id="edge3" class="edge">
+<title>op&#45;002&#45;&gt;array&#45;002</title>
+<path fill="none" stroke="black" d="M32,-272.69C32,-264.91 32,-255.84 32,-247.45"/>
+<polygon fill="black" stroke="black" points="35.5,-247.32 32,-237.32 28.5,-247.32 35.5,-247.32"/>
+</g>
+<!-- op&#45;003 -->
+<g id="node5" class="node">
+<title>op&#45;003</title>
+<g id="a_node5"><a xlink:title="name: op&#45;003&#10;op: blockwise&#10;projected memory: 100.0 MB&#10;tasks: 4&#10;num input blocks: (1,)&#10;calls: &lt;module&gt; &#45;&gt; astype &#45;&gt; map_blocks &#45;&gt; _map_blocks &#45;&gt; blockwise&#10;line: 1 in &lt;module&gt;">
+<path fill="#dcbeff" stroke="black" d="M47,-165C47,-165 17,-165 17,-165 11,-165 5,-159 5,-153 5,-153 5,-136 5,-136 5,-130 11,-124 17,-124 17,-124 47,-124 47,-124 53,-124 59,-130 59,-136 59,-136 59,-153 59,-153 59,-159 53,-165 47,-165"/>
+<text text-anchor="middle" x="32" y="-153" font-family="Helvetica,sans-Serif" font-size="10.00">op&#45;003</text>
+<text text-anchor="middle" x="32" y="-142" font-family="Helvetica,sans-Serif" font-size="10.00">astype</text>
+<text text-anchor="middle" x="32" y="-131" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 4</text>
+</a>
+</g>
+</g>
+<!-- array&#45;002&#45;&gt;op&#45;003 -->
+<g id="edge4" class="edge">
+<title>array&#45;002&#45;&gt;op&#45;003</title>
+<path fill="none" stroke="black" d="M32,-200.82C32,-193.2 32,-184 32,-175.32"/>
+<polygon fill="black" stroke="black" points="35.5,-175.12 32,-165.12 28.5,-175.12 35.5,-175.12"/>
+</g>
+<!-- array&#45;003 -->
+<g id="node6" class="node">
+<title>array&#45;003</title>
+<g id="a_node6"><a xlink:title="name: array&#45;003&#10;variable: c&#10;shape: (3, 3)&#10;chunks: (2, 2)&#10;dtype: float32&#10;chunk memory: 16 bytes&#10;nbytes: 36 bytes">
+<polygon fill="#ffd8b1" stroke="black" points="61.5,-88 2.5,-88 2.5,-52 61.5,-52 61.5,-88"/>
+<text text-anchor="middle" x="32" y="-73" font-family="Helvetica,sans-Serif" font-size="10.00">array&#45;003</text>
+<text text-anchor="middle" x="32" y="-62" font-family="Helvetica,sans-Serif" font-size="10.00">c</text>
+</a>
+</g>
+</g>
+<!-- op&#45;003&#45;&gt;array&#45;003 -->
+<g id="edge5" class="edge">
+<title>op&#45;003&#45;&gt;array&#45;003</title>
+<path fill="none" stroke="black" d="M32,-123.69C32,-115.91 32,-106.84 32,-98.45"/>
+<polygon fill="black" stroke="black" points="35.5,-98.32 32,-88.32 28.5,-98.32 35.5,-98.32"/>
+</g>
+<!-- create&#45;arrays -->
+<g id="node7" class="node">
+<title>create&#45;arrays</title>
+<g id="a_node7"><a xlink:title="name: create&#45;arrays&#10;op: create&#45;arrays&#10;projected memory: 100.0 MB&#10;tasks: 2">
+<path fill="none" stroke="black" d="M140.5,-458C140.5,-458 89.5,-458 89.5,-458 83.5,-458 77.5,-452 77.5,-446 77.5,-446 77.5,-434 77.5,-434 77.5,-428 83.5,-422 89.5,-422 89.5,-422 140.5,-422 140.5,-422 146.5,-422 152.5,-428 152.5,-434 152.5,-434 152.5,-446 152.5,-446 152.5,-452 146.5,-458 140.5,-458"/>
+<text text-anchor="middle" x="115" y="-443" font-family="Helvetica,sans-Serif" font-size="10.00">create&#45;arrays</text>
+<text text-anchor="middle" x="115" y="-432" font-family="Helvetica,sans-Serif" font-size="10.00">tasks: 2</text>
+</a>
+</g>
+</g>
+<!-- arrays -->
+<g id="node8" class="node">
+<title>arrays</title>
+<g id="a_node8"><a xlink:title="name: arrays" target="None">
+<polygon fill="none" stroke="black" points="142,-386 88,-386 88,-350 142,-350 142,-386"/>
+<text text-anchor="middle" x="115" y="-365.5" font-family="Helvetica,sans-Serif" font-size="10.00">arrays</text>
+</a>
+</g>
+</g>
+<!-- create&#45;arrays&#45;&gt;arrays -->
+<g id="edge6" class="edge">
+<title>create&#45;arrays&#45;&gt;arrays</title>
+<path fill="none" stroke="black" d="M115,-421.7C115,-413.98 115,-404.71 115,-396.11"/>
+<polygon fill="black" stroke="black" points="118.5,-396.1 115,-386.1 111.5,-396.1 118.5,-396.1"/>
+</g>
+</g>
+</svg>
diff --git a/docs/user-guide/index.md b/docs/user-guide/index.md
index 22fe6a95..fb0738e6 100644
--- a/docs/user-guide/index.md
+++ b/docs/user-guide/index.md
@@ -10,6 +10,7 @@ executors
 storage
 memory
 reliability
+optimization
 scaling
 diagnostics
 ```
diff --git a/docs/user-guide/optimization.md b/docs/user-guide/optimization.md
new file mode 100644
index 00000000..3844d581
--- /dev/null
+++ b/docs/user-guide/optimization.md
@@ -0,0 +1,120 @@
+# Optimization
+
+Cubed will automatically optimize the computation graph before running it. This can reduce the number of tasks in the plan, and the amount of intermediate IO, both of which speed up the computation.
+
+## Map fusion
+
+The simplest kind of optimization is _map fusion_, where operations that have one preceding operation with the same number of tasks are fused together. This optimization is enabled by default.
+
+You can see the effect of optimization before running any computation by using the `visualize` method on a Cubed array, such as in the following small example. We start by specifying `optimize_graph=False` to turn off optimization so we can see what the unoptimized plan looks like.
+
+```python
+import cubed.array_api as xp
+
+a = xp.asarray([[1, 2, 3], [4, 5, 6], [7, 8, 9]], chunks=(2, 2))
+b = xp.negative(a)
+c = xp.astype(b, xp.float32)
+
+c.visualize("cubed-unoptimized", optimize_graph=False)
+```
+
+![Computation with optimization turned off](../images/optimization_turned_off.svg)
+
+Now we call `visualize` again, this time not setting `optimize_graph` so it picks up its default value of `True`.
+
+```python
+c.visualize()
+```
+
+![Map fusion optimization](../images/optimization_map_fusion.svg)
+
+Note that with optimization turned on, the array `b` is no longer written as an intermediate output since it will be computed in the same tasks that compute array `c`. The overall number of tasks is reduced from 10 to 5, and the intermediate data (total `nbytes`) is reduced too.
+
+Here we have just called `visualize` with the `optimize_graph` argument, but it's also possible to pass it when calling `compute`, which can be useful when debugging a computation.
+
+```python
+c.compute(optimize_graph=False)
+```
+
+## Multiple-input fusion
+
+Cubed supports more powerful optimizations, such as for when an array is created from multiple input arrays. Here is an example, shown first with optimization turned off.
+
+```python
+import cubed.array_api as xp
+
+a = xp.ones((3, 3), chunks=(2, 2))
+b = xp.ones((3, 3), chunks=(2, 2))
+c = xp.ones((3, 3), chunks=(2, 2))
+d = xp.add(b, c)
+e = xp.add(a, d)
+
+e.visualize("cubed-unoptimized", optimize_graph=False)
+```
+
+![Multiple inputs unoptimized](../images/optimization_multiple_inputs_unoptimized.svg)
+
+And with optimization turned on (the default):
+
+```python
+e.visualize()
+```
+
+![Multiple inputs optimized](../images/optimization_multiple_inputs.svg)
+
+Notice how the array `d` is fused away.
+
+## Debugging optimization
+
+Sometimes it can be difficult to understand why particular operations in a computation plan have been fused together - or more commonly, why they have *not* been fused. By enabling debug logging you can get detailed information from the optimize function to help you understand which operations are being fused - or not - and the reason in either case.
+
+Here's the previous example with logging enabled:
+
+```python
+import logging
+
+logging.basicConfig(level=logging.DEBUG)
+
+e.visualize()
+```
+
+The output explains which operations can or can't be fused, and why:
+
+```
+DEBUG:cubed.core.optimization:can't fuse op-001 since it is not a primitive operation, or it uses map_direct
+DEBUG:cubed.core.optimization:can't fuse op-002 since it is not a primitive operation, or it uses map_direct
+DEBUG:cubed.core.optimization:can't fuse op-003 since it is not a primitive operation, or it uses map_direct
+DEBUG:cubed.core.optimization:can't fuse op-004 since no predecessor ops can be fused
+DEBUG:cubed.primitive.blockwise:can fuse op-005 since num tasks of predecessor ops match
+```
+
+## Advanced settings
+
+There are limits to how many input arrays and input chunk reads are fused together. These are imposed so that the number of reads that an individual task must perform is not excessive, which would otherwise result in slow-running tasks.
+
+In some cases you may want to change these limits, which we look at here.
+
+### Total number of source arrays
+
+Cubed will not fuse operations that result in more than 4 source arrays in the fused operation. In the previous example the fused operation has three source arrays (`a`, `b`, and `c`), which is below the default maximum. On the other hand, a computation with a higher "fan-in" that exceeds the maximum will not be fused, or its operations will be fused in stages.
+
+To change this, we have to specify the `optimize_function` that Cubed should use: `multiple_inputs_optimize_dag`. In addition, we use `functools.partial` to set the `max_total_source_arrays` argument to 8 as follows:
+
+```python
+from functools import partial
+from cubed.core.optimization import multiple_inputs_optimize_dag
+
+opt_fn = partial(multiple_inputs_optimize_dag, max_total_source_arrays=8)
+e.visualize(optimize_function=opt_fn)
+```
+
+### Total number of input blocks
+
+The `max_total_num_input_blocks` argument to `multiple_inputs_optimize_dag` specifies the maximum number of input blocks (chunks) that are allowed in the fused operation.
+
+Again, this is to limit the number of reads that an individual task must perform. The default is `None`, which means that operations are fused only if they have the same number of tasks. If set to an integer, then this limitation is removed, and operations with a different number of tasks will be fused - as long as the total number of input blocks does not exceed the maximum. This setting is useful for reductions, and can be set using `functools.partial`:
+
+```python
+opt_fn = partial(multiple_inputs_optimize_dag, max_total_num_input_blocks=10)
+e.visualize(optimize_function=opt_fn)
+```