diff --git a/docs/Project.toml b/docs/Project.toml
new file mode 100644
index 0000000..f969780
--- /dev/null
+++ b/docs/Project.toml
@@ -0,0 +1,10 @@
+[deps]
+Documenter = "e30172f5-a6a5-5a46-863b-614d45cd2de4"
+MemPool = "f9f48841-c794-520a-933b-121f7ba6ed94"
+
+[compat]
+Documenter = "1"
+julia = "1.11"
+
+[sources]
+MemPool = {path = ".."}
\ No newline at end of file
diff --git a/docs/make.jl b/docs/make.jl
new file mode 100644
index 0000000..5a682e9
--- /dev/null
+++ b/docs/make.jl
@@ -0,0 +1,25 @@
+using MemPool
+using Documenter
+import Documenter.Remotes: GitHub
+
+makedocs(;
+    modules = [MemPool],
+    authors = "JuliaParallel and contributors",
+    repo = GitHub("JuliaParallel", "MemPool.jl"),
+    sitename = "MemPool.jl",
+    format = Documenter.HTML(;
+        prettyurls = get(ENV, "CI", "false") == "true",  # pretty URLs only when CI=true
+        canonical = "https://juliaparallel.github.io/MemPool.jl",
+        # assets = String["assets/favicon.ico"],
+    ),
+    pages = [
+        "Home" => "index.md",
+        "API Reference" => "api.md",
+    ],
+    warnonly = [:missing_docs],  # missing docstrings warn instead of failing the build
+)
+
+deploydocs(;
+    repo = "github.com/JuliaParallel/MemPool.jl",
+    devbranch = "master",
+)
\ No newline at end of file
diff --git a/docs/src/api.md b/docs/src/api.md
new file mode 100644
index 0000000..e69de29
diff --git a/docs/src/index.md b/docs/src/index.md
new file mode 100644
index 0000000..52e4dbb
--- /dev/null
+++ b/docs/src/index.md
@@ -0,0 +1,132 @@
+# MemPool: A framework for out-of-core and parallel execution
+
+MemPool.jl is both a framework and in-memory database for storing and accessing Julia
+objects, where those objects may live on local or remote (distributed) Julia processes.
+This allows for communicating about data stored on remote workers, and even data
+potentially paged-out to disk, with a single simple reference (the `DRef`).
+
+As a database, MemPool stores references to objects, and also acts as a "gatekeeper"
+when those objects are later accessed through their reference. It can be configured to
+page data out to disk, and then when data is accessed, will page out other data to make
+space in RAM for this newly-loaded data. This allows MemPool to provide "out-of-core"
+data management for libraries or applications - Dagger.jl is one such library that utilizes
+MemPool for this purpose.
+
+
+### Remote Workers Caveat
+
+When using MemPool with multiple workers, make sure that the workers are
+initialized *before* importing MemPool. This ensures the package is loaded on all nodes:
+```julia-repl
+julia> using Distributed
+
+julia> addprocs(2)
+
+julia> using MemPool
+```
+
+-----
+
+## Quickstart: Data Management
+
+For more details: [Data Management](@ref)
+
+The core of MemPool revolves around the `DRef` (Distributed Reference). A `DRef` is a pointer
+to data that might live in local RAM, remote RAM, or on disk.
+
+### Creating and retrieving data
+
+Use `poolset` to register data with the pool and `poolget` to retrieve the actual value:
+
+```julia
+using MemPool
+
+A = rand(1000, 1000)
+ref = poolset(A)
+
+A_retrieved = poolget(ref)
+```
+This will track a large array (`A`) as a `DRef` using `poolset(A)`. 
+You can now safely clear the reference `A` (such as by `A = nothing`),
+and later retrieve `A` from the `DRef` using `poolget(ref)`.
+
+
+### Manual Worker Assignment
+
+You can force data to be stored on a specific worker by passing a worker ID to `poolset`:
+
+```julia
+ref_w2 = poolset(rand(500), 2)
+```
+
+Note that if the current worker is not worker 2, this will make a copy of the array
+from `rand(500)` on worker 2, and will not share memory with the original array.
+
+## Quickstart: Out-of-Core Configuration
+
+MemPool provides helper functions to set up out-of-core data management for all
+`DRef`s created with `poolset`.
+
+### Enabling the Disk Cache
+
+```julia
+# 1. Define the configuration
+cfg = MemPool.DiskCacheConfig(
+    toggle = true,
+    membound = 4 * 1024^3,                  # 4GB RAM Limit
+    diskpath = "/tmp/mempool_cache",        # Disk storage location
+    allocator_type = "LRU"                  # Least Recently Used eviction
+)
+
+# 2. Apply the configuration
+MemPool.setup_global_device!(cfg)
+```
+
+When the amount of data tracked by MemPool exceeds `membound` in byte size,
+MemPool will perform activities such as triggering a GC sweep, or swapping other
+data to `diskpath` and removing that other data from memory. Note that `diskpath`
+must be a directory - each piece of data gets its own file.
+
+### Memory Reservation Logic
+
+MemPool includes an `ensure_memory_reserved` mechanism, which prevents memory
+usage from exceeding a set global memory boundary. When `poolset` is called,
+the system checks if the OS is running tight on memory. If so, it will:
+1. Trigger a local GC.
+2. If memory is still tight, trigger a full `GC.gc(true)`.
+3. Finally, trigger a cluster-wide GC (`@everywhere GC.gc(true)`). 
+
+This mechanism is separate from the `DiskCacheConfig` logic, and can be configured by
+tuning `MemPool.MEM_RESERVED[]` (this is specified in terms of the minimum number
+of bytes that must be free for use by the OS).
+
+
+## Quickstart: Persistence & Migration
+
+### Migrating Data Between Workers
+
+If necessary, data can be moved (copied) from one worker to another, without breaking
+existing `DRef` references:
+
+```julia
+# Move data from current owner to worker 3
+new_ref = MemPool.migrate!(ref, 3)
+```
+
+While it does return `new_ref` (a reference to the newly-copied data on worker 3),
+accesses to `ref` will also automatically redirect to `new_ref` during `poolget`.
+This can be very helpful to seamlessly migrate data when it would be more efficient
+to read the data from another worker. Dagger.jl uses this mechanism for its streaming
+API, which uses it to migrate streaming tasks to other workers while they run.
+
+### Managed File I/O
+
+Treat files as managed `DRef` objects to avoid loading massive datasets into RAM all at once:
+
+```julia
+# Create a lazy reference (handled by Dagger)
+f = Dagger.File("large_dataset.jls")
+
+# When you fetch, MemPool manages the resulting memory
+data = fetch(f)
+```
diff --git a/src/datastore.jl b/src/datastore.jl
index a58b999..816fea4 100644
--- a/src/datastore.jl
+++ b/src/datastore.jl
@@ -6,6 +6,13 @@ else
     import Distributed: ClusterSerializer, worker_id_from_socket
 end
 
+"""
+    DRef(owner::Int, id::Int, size::UInt)
+
+A Distributed Reference (`DRef`) acts as a handle to data stored in MemPool.
+It tracks which worker `owner` holds the data and a unique `id` assigned to the data.
+`size` stores an approximation of the in-memory byte size of the object.
+"""
 mutable struct DRef
     owner::Int
     id::Int
@@ -451,6 +458,12 @@ function ensure_memory_reserved(size::Integer=0; max_sweeps::Integer=MEM_RESERVE
     end
 end
 
+"""
+    poolset(x, [pid]; kwargs...) -> DRef
+    
+Stores the value `x` into the memory pool on worker `pid` (defaults to `myid()`)
+and returns a `DRef` handle that can be used to later access the value.
+"""
 function poolset(@nospecialize(x), pid=myid(); size=approx_size(x),
                  retain=false, restore=false,
                  device=GLOBAL_DEVICE[], leaf_device=initial_leaf_device(device),
@@ -523,6 +536,12 @@ function forwardkeyerror(f)
     end
 end
 
+"""
+    poolget(ref::DRef)
+
+Retrieves the data value referenced by `ref`. If the data is remote or
+on disk, MemPool handles the retrieval automatically.
+"""
 function poolget(ref::DRef)
     DEBUG_REFCOUNTING[] && _enqueue_work(Core.print, "?? (", ref.owner, ", ", ref.id, ") at ", myid(), "\n")
     return access_ref(identity, ref)