JuliaParallel
diff --git a/Diff for: ‎Project.toml
+1 b/Diff for: ‎Project.toml
+1
diff --git a/Diff for: ‎docs/make.jl
+1 b/Diff for: ‎docs/make.jl
+1
diff --git a/Diff for: ‎docs/src/datadeps.md
+55 b/Diff for: ‎docs/src/datadeps.md
+55
diff --git a/Diff for: ‎src/Dagger.jl
+4 b/Diff for: ‎src/Dagger.jl
+4
@@ -5,6 +5,7 @@ version = "0.18.6"
 [deps]
 DataStructures = "864edb3b-99cc-5e75-8d2d-829cb0a9cfe8"
 Distributed = "8ba89e20-285c-5b6f-9357-94700520ee1b"
+Graphs = "86223c79-3864-5bf0-83f7-82e725a168b6"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
 MacroTools = "1914dd2f-81c6-5fcd-8719-6d5c9610ff09"
 MemPool = "f9f48841-c794-520a-933b-121f7ba6ed94"
 
@@ -22,6 +22,7 @@ makedocs(;
         "Scopes" => "scopes.md",
         "Processors" => "processors.md",
         "Task Queues" => "task-queues.md",
+        "Datadeps" => "datadeps.md",
         "Option Propagation" => "propagation.md",
         "Logging and Graphing" => "logging.md",
         "Checkpointing" => "checkpointing.md",
 
@@ -0,0 +1,55 @@
+# Datadeps (Data Dependencies)
+
+For many programs, the rule that tasks cannot write to their arguments
+feels overly restrictive and makes certain kinds of programs (such as in-place
+linear algebra) hard to express efficiently in Dagger. Thankfully, there is a
+solution: `spawn_datadeps`. This function constructs a "datadeps region",
+within which tasks are allowed to write to their arguments, with parallelism
+controlled by dependencies specified via argument annotations. Let's look at
+a simple example to make things concrete:
+
+```julia
+A = rand(1000)
+B = rand(1000)
+C = zeros(1000)
+add!(X, Y) = X .+= Y
+Dagger.spawn_datadeps() do
+    Dagger.@spawn add!(InOut(B), In(A))
+    Dagger.@spawn copyto!(Out(C), In(B))
+end
+```
+
+In this example, we have two Dagger tasks being launched, one adding `A` into
+`B`, and the other copying `B` into `C`. The `add!` task is specifying that
+`A` is only being read from (`In` for "input"), and that `B` is being read
+from and written to (`InOut` for "input and output"). The `copyto!` task,
+similarly, is specifying that `B` is being read from, and that `C` is only
+being written to (`Out` for "output").
+
+Without `spawn_datadeps` and `In`, `Out`, and `InOut`, the result of these
+tasks would be undefined; the two tasks could execute in parallel, or the
+`copyto!` could occur before the `add!`, resulting in all kinds of mayhem.
+However, `spawn_datadeps` changes things: because we have told Dagger how our
+tasks access their arguments, Dagger knows to control the parallelism and
+ordering, and ensure that `add!` executes and finishes before `copyto!`
+begins, so that `copyto!` "sees" the changes to `B` before executing.
+
+There is another important aspect of `spawn_datadeps` that makes the above
+code work: if all of the `Dagger.@spawn` macros were removed, along with the
+dependency specifiers, the program would still produce the same results,
+without using Dagger. In other words, the parallel (Dagger) version of the
+program produces identical results to the serial (non-Dagger) version of the
+program. This is similar to using Dagger with purely functional tasks and
+without `spawn_datadeps` - removing `Dagger.@spawn` will still result in a
+correct (sequential and possibly slower) version of the program. Basically,
+`spawn_datadeps` will ensure that Dagger respects the ordering and
+dependencies of a program, while still providing parallelism, where possible.
+
+But where is the parallelism? The above example doesn't actually have any
+parallelism to exploit! Let's take a look at another example to see the
+datadeps model truly shine:
+
+```julia
+function tree_reduce!(As::Vector{Array})
+end
+```
@@ -34,6 +34,7 @@ include("queue.jl")
 include("thunk.jl")
 include("submission.jl")
 include("chunks.jl")
+include("memory-spaces.jl")
 
 # Task scheduling
 include("compute.jl")
@@ -42,6 +43,9 @@ include("utils/system_uuid.jl")
 include("utils/caching.jl")
 include("sch/Sch.jl"); using .Sch
 
+# Data dependency task queue
+include("datadeps.jl")
+
 # Array computations
 include("array/darray.jl")
 include("array/alloc.jl")