diff --git a/docs/distributed.rst b/docs/distributed.rst
index 8b68697f..5bd5c282 100644
--- a/docs/distributed.rst
+++ b/docs/distributed.rst
@@ -23,8 +23,8 @@ but making it available in the GUI is another good PR or feature request.
 Examples
 ~~~~~~~~
 
-Run distributed Cellpose on half the resources of a workstation that has 16 cpus, 1 gpu, and 128GB system memory:
-............................
+Run distributed Cellpose on half the resources of a workstation that has 16 cpus, 1 gpu,
+and 128GB system memory:
 
 .. code-block:: python
 
@@ -60,3 +60,72 @@ Run distributed Cellpose on half the resources of a workstation that has 16 cpus
     )
 
 
+Test run a single block before distributing the whole dataset (always a good idea):
+
+.. code-block:: python
+
+    from cellpose.contrib.distributed_segmentation import process_block
+
+    # parameterize cellpose however you like
+    model_kwargs = {'gpu':True, 'model_type':'cyto3'}
+    eval_kwargs = {'diameter':30,
+                   'z_axis':0,
+                   'channels':[0,0],
+                   'do_3D':True,
+    }
+
+    # define a crop as the distributed function would
+    starts = (128, 128, 128)
+    blocksize = (256, 256, 256)
+    overlap = 60
+    crop = tuple(slice(s-overlap, s+b+overlap) for s, b in zip(starts, blocksize))
+
+    # call the segmentation
+    segments, boxes, box_ids = process_block(
+        block_index=(0, 0, 0),  # when test_mode=True this is just a dummy value
+        crop=crop,
+        input_zarr=my_zarr_array,
+        model_kwargs=model_kwargs,
+        eval_kwargs=eval_kwargs,
+        blocksize=blocksize,
+        overlap=overlap,
+        output_zarr=None,
+        test_mode=True,
+    )
+
+
+Run distributed Cellpose on an LSF cluster with 128 GPUs (e.g. Janelia cluster):
+
+.. code-block:: python
+
+    from cellpose.contrib.distributed_segmentation import distributed_eval
+
+    # parameterize cellpose however you like
+    model_kwargs = {'gpu':True, 'model_type':'cyto3'}
+    eval_kwargs = {'diameter':30,
+                   'z_axis':0,
+                   'channels':[0,0],
+                   'do_3D':True,
+    }
+
+    # define LSFCluster parameters
+    cluster_kwargs = {
+        'ncpus':2,  # cpus per worker
+        'min_workers':8,  # cluster adapts number of workers based on number of blocks
+        'max_workers':128,
+        'queue':'gpu_l4',  # flags required to specify a gpu job may differ between clusters
+        'job_extra_directives':['-gpu "num=1"'],
+    }
+
+    # run segmentation
+    # outputs:
+    #    segments: zarr array containing labels
+    #    boxes: list of bounding boxes around all labels (very useful for navigating big data)
+    segments, boxes = distributed_eval(
+        input_zarr=large_zarr_array,
+        blocksize=(256, 256, 256),
+        write_path='/where/zarr/array/containing/results/will/be/written.zarr',
+        model_kwargs=model_kwargs,
+        eval_kwargs=eval_kwargs,
+        cluster_kwargs=cluster_kwargs,
+    )