diff --git a/pyproject.toml b/pyproject.toml index 2668d82..cd5acc1 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -19,7 +19,6 @@ urls.Documentation = "https://Nimbus-Inference.readthedocs.io/" urls.Source = "https://github.com/angelolab/Nimbus-Inference" urls.Home-page = "https://github.com/angelolab/Nimbus-Inference" dependencies = [ - "ark-analysis", "torch>=2.2.0", "alpineer", "scikit-image", diff --git a/src/nimbus_inference/example_dataset.py b/src/nimbus_inference/example_dataset.py new file mode 100644 index 0000000..6642085 --- /dev/null +++ b/src/nimbus_inference/example_dataset.py @@ -0,0 +1,217 @@ +# Code copied from github.com/angelolab/ark-analysis +import pathlib +import shutil +import warnings +from typing import Union +import datasets +from alpineer.misc_utils import verify_in_list + +EXAMPLE_DATASET_REVISION: str = "main" + + +class ExampleDataset: + def __init__(self, dataset: str, overwrite_existing: bool = True, cache_dir: str = None, + revision: str = None) -> None: + """ + Constructs a utility class for downloading and moving the dataset with respect to it's + various partitions on Hugging Face: https://huggingface.co/datasets/angelolab/ark_example. + + Args: + dataset (str): The name of the dataset to download. Can be one of + + * `"segment_image_data"` + * `"cluster_pixels"` + * `"cluster_cells"` + * `"post_clustering"` + * `"fiber_segmentation"` + * `"LDA_preprocessing"` + * `"LDA_training_inference"` + * `"neighborhood_analysis"` + * `"pairwise_spatial_enrichment"` + * `"ome_tiff"` + * `"ez_seg_data"` + overwrite_existing (bool): A flag to overwrite existing data. Defaults to `True`. + cache_dir (str, optional): The directory to save the cache dir. Defaults to `None`, + which internally in Hugging Face defaults to `~/.cache/huggingface/datasets`. + revision (str, optional): The commit ID from Hugging Face for the dataset. Used for + internal development only. Allows the user to fetch a commit from a particular + `revision` (Hugging Face's terminology for branch). Defaults to `None`. Which + defaults to the latest version in the `main` branch. + (https://huggingface.co/datasets/angelolab/ark_example/tree/main). + """ + self.dataset_paths = None + self.dataset = dataset + self.overwrite_existing = overwrite_existing + self.cache_dir = cache_dir if cache_dir else pathlib.Path("~/.cache/huggingface/datasets").expanduser() + self.revision = revision + + self.path_suffixes = { + "image_data": "image_data", + "cell_table": "segmentation/cell_table", + "deepcell_output": "segmentation/deepcell_output", + "example_pixel_output_dir": "pixie/example_pixel_output_dir", + "example_cell_output_dir": "pixie/example_cell_output_dir", + "spatial_lda": "spatial_analysis/spatial_lda", + "post_clustering": "post_clustering", + "ome_tiff": "ome_tiff", + "ez_seg_data": "ez_seg_data" + } + """ + Path suffixes for mapping each downloaded dataset partition to it's appropriate + relative save directory. + """ + + def download_example_dataset(self): + """ + Downloads the example dataset from Hugging Face Hub. + The following is a link to the dataset used: + https://huggingface.co/datasets/angelolab/ark_example + + The dataset will be downloaded to the Hugging Face default cache + `~/.cache/huggingface/datasets`. 
+ """ + ds_paths = datasets.load_dataset(path="angelolab/ark_example", + revision=self.revision, + name=self.dataset, + cache_dir=self.cache_dir, + token=False, + trust_remote_code=True) + + # modify the paths to be relative to the os + # For example: + # '/Users/user/.cache/huggingface/datasets/downloads/extracted/' + # becomes 'pathlib.path(self.dataset_cache) / downloads/extracted//' + self.dataset_paths = {} + for ds_name,ds in ds_paths.items(): + self.dataset_paths[ds_name] = {} + for feature in ds.features: + p, = ds[feature] + # extract the path relative to the cache_dir (last 3 parts of the path) + p = pathlib.Path(*pathlib.Path(p).parts[-3:]) + # Set the start of the path to the cache_dir (for the user's machine) + self.dataset_paths[ds_name][feature] = self.cache_dir / p / feature + + + def check_empty_dst(self, dst_path: pathlib.Path) -> bool: + """ + Checks to see if the folder for a dataset config already exists in the `save_dir` + (i.e. `dst_path` is the specific folder for the config.). If the folder exists, and + there are no contents, then it'll return True, False otherwise. + + Args: + dst_path (pathlib.Path): The destination directory to check to see if + files exist in it. + + Returns: + bool: Returns `True` if there are no files in the directory `dst_path`. + Returns `False` if there are files in that directory `dst_path`. + """ + dst_files = list(dst_path.rglob("*")) + + if len(dst_files) == 0: + return True + else: + return False + + def move_example_dataset(self, move_dir: Union[str, pathlib.Path]): + """ + Moves the downloaded example data from the `cache_dir` to the `save_dir`. + + Args: + move_dir (Union[str, pathlib.Path]): The path to save the dataset files in. + """ + if type(move_dir) is not pathlib.Path: + move_dir = pathlib.Path(move_dir) + + dataset_names = list(self.dataset_paths[self.dataset].keys()) + + for ds_n in dataset_names: + ds_n_suffix: str = pathlib.Path(self.path_suffixes[ds_n]) + + # The path where the dataset is saved in the Hugging Face Cache post-download, + # Necessary to copy + move the data from the cache to the user specified `move_dir`. + src_path = pathlib.Path(self.dataset_paths[self.dataset][ds_n]) + dst_path: pathlib.Path = move_dir / ds_n_suffix + + # Overwrite the existing dataset when `overwrite_existing` == `True` + # and when the `dst_path` is empty. + + # `True` if `dst_path` is empty, `False` if data exists in `dst_path` + empty_dst_path: bool = self.check_empty_dst(dst_path=dst_path) + + if self.overwrite_existing: + if not empty_dst_path: + warnings.warn(UserWarning(f"Files exist in {dst_path}. \ + They will be overwritten by the downloaded example dataset.")) + + # Remove files in the destination path + [f.unlink() for f in dst_path.glob("*") if f.is_file()] + # Fill destination path + shutil.copytree(src_path, dst_path, dirs_exist_ok=True, + ignore=shutil.ignore_patterns(r"\.\!*")) + else: + if empty_dst_path: + warnings.warn(UserWarning(f"Files do not exist in {dst_path}. \ + The example dataset will be added in.")) + shutil.copytree(src_path, dst_path, dirs_exist_ok=True, + ignore=shutil.ignore_patterns(r"\.\!*")) + else: + warnings.warn(UserWarning(f"Files exist in {dst_path}. \ + They will not be overwritten.")) + + +def get_example_dataset(dataset: str, save_dir: Union[str, pathlib.Path], + overwrite_existing: bool = True): + """ + A user facing wrapper function which downloads a specified dataset from Hugging Face, + and moves it to the specified save directory `save_dir`. 
+ The dataset may be found here: https://huggingface.co/datasets/angelolab/ark_example + + + Args: + dataset (str): The name of the dataset to download. Can be one of + + * `"segment_image_data"` + * `"cluster_pixels"` + * `"cluster_cells"` + * `"post_clustering"` + * `"fiber_segmentation"` + * `"LDA_preprocessing"` + * `"LDA_training_inference"` + * `"neighborhood_analysis"` + * `"pairwise_spatial_enrichment"` + * `"ez_seg_data"` + save_dir (Union[str, pathlib.Path]): The path to save the dataset files in. + overwrite_existing (bool): The option to overwrite existing configs of the `dataset` + downloaded. Defaults to True. + """ + + valid_datasets = ["segment_image_data", + "cluster_pixels", + "cluster_cells", + "post_clustering", + "fiber_segmentation", + "LDA_preprocessing", + "LDA_training_inference", + "neighborhood_analysis", + "pairwise_spatial_enrichment", + "ome_tiff", + "ez_seg_data"] + + # Check the appropriate dataset name + try: + verify_in_list(dataset=dataset, valid_datasets=valid_datasets) + except ValueError: + err_str: str = f"""The dataset \"{dataset}\" is not one of the valid datasets available. + The following are available: {*valid_datasets,}""" + raise ValueError(err_str) from None + + example_dataset = ExampleDataset(dataset=dataset, overwrite_existing=overwrite_existing, + cache_dir=None, + revision=EXAMPLE_DATASET_REVISION) + + # Download the dataset + example_dataset.download_example_dataset() + + # Move the dataset over to the save_dir from the user. + example_dataset.move_example_dataset(move_dir=save_dir) \ No newline at end of file diff --git a/tests/test_example_dataset.py b/tests/test_example_dataset.py new file mode 100644 index 0000000..75e8959 --- /dev/null +++ b/tests/test_example_dataset.py @@ -0,0 +1,627 @@ +# copied from github.com/angelolab/ark-analysis +import pathlib +import shutil +from typing import Callable, Generator, Iterator, List, Union +import pytest +import os +from pathlib import Path +from alpineer import test_utils +from nimbus_inference.example_dataset import (ExampleDataset, get_example_dataset, + EXAMPLE_DATASET_REVISION) + + +@pytest.fixture(scope="class", params=["segment_image_data", + "cluster_pixels", + "cluster_cells", + "post_clustering", + "fiber_segmentation", + "LDA_preprocessing", + "LDA_training_inference", + "neighborhood_analysis", + "pairwise_spatial_enrichment", + "ome_tiff", + "ez_seg_data"]) +def dataset_download(request, dataset_cache_dir) -> Iterator[ExampleDataset]: + """ + A Fixture which instantiates and downloads the dataset with respect to each + notebook. + + Args: + request (pytest.FixtureRequest): The parameter, in this case it is the notebook to + download the dataset for. + + Yields: + Iterator[ExampleDataset]: The iterable Example Dataset. 
+ """ + # Set up ExampleDataset class + example_dataset = ExampleDataset( + dataset=request.param, + cache_dir=dataset_cache_dir, + revision=EXAMPLE_DATASET_REVISION + ) + + # Download example data for a particular notebook + example_dataset.download_example_dataset() + yield example_dataset + + +@pytest.fixture(scope="function") +def cleanable_tmp_path(tmp_path_factory: pytest.TempPathFactory) -> Iterator[pathlib.Path]: + data_path = tmp_path_factory.mktemp("data") + yield data_path + shutil.rmtree(data_path) + + +@pytest.fixture(scope="class") +def dataset_cache_dir() -> Iterator[Union[str, None]]: + # Change cache directory if running on CI + if os.environ.get("CI", None): + cache_dir = (Path(os.environ.get("GITHUB_WORKSPACE")) / "data" / "cache").resolve() + else: + cache_dir = None + yield cache_dir + + +class TestExampleDataset: + @pytest.fixture(autouse=True) + def _setup(self): + """ + Sets up necessary information needed for assert statements. + Sets up dictionary to call the functions which check each dataset that is downloaded. + """ + self.fov_names = [f"fov{i}" for i in range(11)] + self.channel_names = ["CD3", "CD4", "CD8", "CD14", "CD20", "CD31", "CD45", "CD68", + "CD163", "CK17", "Collagen1", "ECAD", "Fibronectin", "GLUT1", + "H3K9ac", "H3K27me3", "HLADR", "IDO", "Ki67", "PD1", "SMA", "Vim"] + + self.cell_table_names = ["cell_table_arcsinh_transformed", "cell_table_size_normalized", + "cell_table_size_normalized_cell_labels", + "generalized_cell_table_input"] + + self.deepcell_output_names = [f"fov{i}_{j}" for i in range(11) + for j in ['whole_cell', 'nuclear']] + + self._example_pixel_output_dir_names = { + "root_files": ["cell_clustering_params", "channel_norm_pre_rownorm", "pixel_thresh", + "pixel_channel_avg_meta_cluster", "pixel_channel_avg_som_cluster", + "pixel_meta_cluster_mapping", "pixel_som_weights", + "channel_norm_post_rownorm"], + "pixel_mat_data": [f"fov{i}" for i in range(11)], + "pixel_mat_subset": [f"fov{i}" for i in range(11)], + "pixel_masks": [f"fov{i}_pixel_mask" for i in range(2)] + } + + self._example_cell_output_dir_names = { + "root_files": ["cell_meta_cluster_channel_avg", + "cell_meta_cluster_count_avg", + "cell_som_cluster_channel_avg", + "cell_meta_cluster_mapping", + "cell_som_cluster_channel_avg", + "cell_som_cluster_count_avg", + "cell_som_weights", "cluster_counts", + "cluster_counts_size_norm", "weighted_cell_channel"], + "cell_masks": [f"fov{i}_cell_mask" for i in range(2)] + } + + self._spatial_analysis_lda_preprocessed_files: List[str] = [ + "difference_mats", + "featurized_cell_table", + "formatted_cell_table", + "fov_stats", + "topic_eda"] + + self._post_clustering_files = ["cell_table_thresholded", + "marker_thresholds", "updated_cell_table"] + + self._ome_tiff_files: List[str] = ["fov1.ome"] + + self._ez_seg_files = { + "fov_names": [f"fov{i}" for i in range(10)], + "channel_names": [ + "Ca40", + "GFAP", + "Synaptophysin", + "PanAmyloidbeta1724", + "Na23", + "Reelin", + "Presenilin1NTF", + "Iba1", + "CD105", + "C12", + "EEA1", + "VGLUT1", + "PolyubiK63", + "Ta181", + "Au197", + "Si28", + "PanGAD6567", + "CD33Lyo", + "MAP2", + "Calretinin", + "PolyubiK48", + "MAG", + "TotalTau", + "Amyloidbeta140", + "Background", + "CD45", + "8OHGuano", + "pTDP43", + "ApoE4", + "PSD95", + "TH", + "HistoneH3Lyo", + "CD47", + "Parvalbumin", + "Amyloidbeta142", + "Calbindin", + "PanApoE2E3E4", + "empty139", + "CD31", + "MCT1", + "MBP", + "SERT", + "PHF1Tau", + "VGAT", + "VGLUT2", + "CD56Lyo", + "MFN2", + ], + "composite_names": [ + "amyloid", + 
"microglia-composite", + ], + "ez_mask_suffixes": ["microglia-projections", "plaques"], + "merged_mask_suffixes": + ["final_whole_cell_remaining", "microglia-projections_merged"], + "final_mask_suffixes": + ["final_whole_cell_remaining", "microglia-projections_merged", "plaques"], + "cell_table_names": [ + "cell_and_objects_table_arcsinh_transformed", + "cell_and_objects_table_size_normalized", + "filtered_final_whole_cell_remaining_table_arcsinh_transformed", + "filtered_final_whole_cell_remaining_table_size_normalized", + "filtered_microglia-projections_merged_table_arcsinh_transformed", + "filtered_microglia-projections_merged_table_size_normalized", + "filtered_plaques_table_arcsinh_transformed", + "filtered_plaques_table_size_normalized", + ], + "log_names": [ + "amyloid_composite_log", + "mask_merge_log", + "microglia-composite_composite_log", + "microglia-projections_segmentation_log", + "plaques_segmentation_log" + ], + } + + # Mapping the datasets to their respective test functions. + self.dataset_test_fns: dict[str, Callable] = { + "image_data": self._image_data_check, + "cell_table": self._cell_table_check, + "deepcell_output": self._deepcell_output_check, + "example_pixel_output_dir": self._example_pixel_output_dir_check, + "example_cell_output_dir": self._example_cell_output_dir_check, + "spatial_lda": self._spatial_lda_output_dir_check, + "post_clustering": self._post_clustering_output_dir_check, + "ome_tiff": self._ome_tiff_check, + "ez_seg_data": self._ez_seg_data_check + } + + # Should be the same as `example_dataset.ExampleDataset.path_suffixes` + self.move_path_suffixes = { + "image_data": "image_data", + "cell_table": "segmentation/cell_table", + "deepcell_output": "segmentation/deepcell_output", + "example_pixel_output_dir": "pixie/example_pixel_output_dir", + "example_cell_output_dir": "pixie/example_cell_output_dir", + "spatial_lda": "spatial_analysis/spatial_lda", + "post_clustering": "post_clustering", + "ome_tiff": "ome_tiff", + "ez_seg_data": "ez_seg_data", + } + + def test_download_example_dataset(self, dataset_download: ExampleDataset): + """ + Tests to make sure the proper files are downloaded from Hugging Face. + + Args: + dataset_download (ExampleDataset): Fixture for the dataset, respective to each + """ + import os + dataset_names = list( + dataset_download.dataset_paths[dataset_download.dataset].keys() + ) + for ds_n in dataset_names: + dataset_cache_path = pathlib.Path( + dataset_download.dataset_paths[dataset_download.dataset][ds_n] + ) + self.dataset_test_fns[ds_n](dir_p=dataset_cache_path) + + @pytest.mark.parametrize("_overwrite_existing", [True, False]) + def test_move_example_dataset(self, cleanable_tmp_path, dataset_download: ExampleDataset, + _overwrite_existing: bool): + """ + Tests to make sure the proper files are moved to the correct directories. + + Args: + cleanable_tmp_path (pytest.TempPathFactory): Factory for temporary directories under + the common base temp directory. + dataset_download (ExampleDataset): Fixture for the dataset, respective to each + partition (`segment_image_data`, `cluster_pixels`, `cluster_cells`, + `post_clustering`). + _overwrite_existing (bool): If `True` the dataset will be overwritten. If `False` it + will not be. 
+ """ + dataset_download.overwrite_existing = _overwrite_existing + + # Move data if _overwrite_existing is `True` + if _overwrite_existing: + + # Case 1: Move Path is empty + tmp_dir_c1: pathlib.Path = cleanable_tmp_path / "move_example_data_c1" + tmp_dir_c1.mkdir(parents=True, exist_ok=False) + + move_dir_c1: pathlib.Path = tmp_dir_c1 / "example_dataset" + move_dir_c1.mkdir(parents=True, exist_ok=False) + + dataset_download.move_example_dataset(move_dir=move_dir_c1) + + for dir_p, ds_n in self._suffix_paths(dataset_download, parent_dir=move_dir_c1): + self.dataset_test_fns[ds_n](dir_p) + + # Case 2: Move Path contains files + tmp_dir_c2: pathlib.Path = cleanable_tmp_path / "move_example_data_c2" + tmp_dir_c2.mkdir(parents=True, exist_ok=False) + + move_dir_c2: pathlib.Path = tmp_dir_c2 / "example_dataset" + move_dir_c2.mkdir(parents=True, exist_ok=False) + + # Add files for each config to test moving with files + for dir_p, ds_n in self._suffix_paths(dataset_download, parent_dir=move_dir_c2): + # make directory + dir_p.mkdir(parents=True, exist_ok=False) + # make blank file + test_utils._make_blank_file(dir_p, "data_test.txt") + + # Move files to directory which has existing files + # Make sure warning is raised + with pytest.warns(UserWarning): + dataset_download.move_example_dataset(move_dir=move_dir_c2) + for dir_p, ds_n in self._suffix_paths(dataset_download, parent_dir=move_dir_c2): + self.dataset_test_fns[ds_n](dir_p) + + # Move data if _overwrite_existing is `False` + else: + # Case 1: Move Path is empty + tmp_dir_c1: pathlib.Path = cleanable_tmp_path / "move_example_data_c1" + tmp_dir_c1.mkdir(parents=True, exist_ok=False) + move_dir_c1 = tmp_dir_c1 / "example_dataset" + move_dir_c1.mkdir(parents=True, exist_ok=False) + + # Check that the files were moved to the empty directory + # Make sure warning is raised + with pytest.warns(UserWarning): + dataset_download.move_example_dataset(move_dir=move_dir_c1) + + for dir_p, ds_n in self._suffix_paths(dataset_download, parent_dir=move_dir_c1): + self.dataset_test_fns[ds_n](dir_p) + + # Case 2: Move Path contains files + tmp_dir_c2 = cleanable_tmp_path / "move_example_data_c2" + tmp_dir_c2.mkdir(parents=True, exist_ok=False) + move_dir_c2 = tmp_dir_c2 / "example_dataset" + move_dir_c2.mkdir(parents=True, exist_ok=False) + + # Add files for each config to test moving with files + for dir_p, ds_n in self._suffix_paths(dataset_download, parent_dir=move_dir_c2): + # make directory + dir_p.mkdir(parents=True, exist_ok=False) + # make blank file + test_utils._make_blank_file(dir_p, "data_test.txt") + + # Do not move files to directory containing files + # Make sure warning is raised. + with pytest.warns(UserWarning): + dataset_download.move_example_dataset(move_dir=move_dir_c2) + for dir_p, ds_n in self._suffix_paths(dataset_download, parent_dir=move_dir_c2): + assert len(list(dir_p.rglob("*"))) == 1 + + # Will cause duplicate downloads + def test_get_example_dataset(self, cleanable_tmp_path): + """ + Tests to make sure that if an incorrect `dataset` is provided, the function + errors out with an appropriate error message for the user. + """ + + with pytest.raises(ValueError): + get_example_dataset("incorrect_dataset", save_dir=cleanable_tmp_path) + + def test_check_empty_dst(self, tmp_path): + """ + Tests to make sure that `ExampleDataset.check_empty_dst()` accurately + reports if a directory contains files or not. 
+ """ + + example_dataset = ExampleDataset(None) + empty_data_dir: pathlib.Path = tmp_path / "empty_dst_dir" + packed_data_dir: pathlib.Path = tmp_path / "packed_dst_dir" + empty_data_dir.mkdir(parents=True) + packed_data_dir.mkdir(parents=True) + + # Empty directory has no files + assert example_dataset.check_empty_dst(empty_data_dir) is True + + # Directory has files + test_utils._make_blank_file(packed_data_dir, "data_test.txt") + assert example_dataset.check_empty_dst(packed_data_dir) is False + + def _image_data_check(self, dir_p: pathlib.Path): + """ + Checks to make sure that all the FOVs exist. + + Args: + dir (pathlib.Path): The directory to check. + """ + # Check to make sure all the FOVs exist + downloaded_fovs = list(dir_p.glob("*")) + downloaded_fov_names = [f.stem for f in downloaded_fovs] + assert set(self.fov_names) == set(downloaded_fov_names) + + # Check to make sure all 22 channels exist + for fov in downloaded_fovs: + c_names = [c.stem for c in fov.rglob("*")] + assert set(self.channel_names) == set(c_names) + + def _cell_table_check(self, dir_p: pathlib.Path): + """ + Checks to make sure that the following cell tables exist: + * `cell_table_arcsinh_transformed.csv` + * `cell_table_size_normalized.csv` + + Args: + dir_p (pathlib.Path): The directory to check. + """ + + downloaded_cell_tables = list(dir_p.glob("*.csv")) + downloaded_cell_table_names = [f.stem for f in downloaded_cell_tables] + assert set(self.cell_table_names) == set(downloaded_cell_table_names) + + def _deepcell_output_check(self, dir_p: pathlib.Path): + """ + Checks to make sure that all cell nucleus (nuclear) and cell membrane masks (whole_cell) + exist from deepcell output. + + Args: + dir_p (pathlib.Path): The directory to check. + """ + downloaded_deepcell_output = list(dir_p.glob("*.tiff")) + downloaded_deepcell_output_names = [f.stem for f in downloaded_deepcell_output] + assert set(self.deepcell_output_names) == set(downloaded_deepcell_output_names) + + def _example_pixel_output_dir_check(self, dir_p: pathlib.Path): + """ + `example_pixel_output_dir`. + ├── cell_clustering_params.json + ├── channel_norm.feather + ├── pixel_thresh.feather + ├── pixel_channel_avg_meta_cluster.csv + ├── pixel_channel_avg_som_cluster.csv + ├── pixel_masks/ + │ ├── fov0_pixel_mask.tiff + │ └── fov1_pixel_mask.tiff + ├── pixel_mat_data/ + │ ├── fov0.feather + │ ├── fov1.feather + │ ├── ... + │ └── fov10.feather + ├── pixel_mat_subset/ + │ ├── fov0.feather + │ ├── fov1.feather + │ ├── ... + │ └── fov10.feather + ├── pixel_meta_cluster_mapping.csv + ├── pixel_som_weights.feather + └── channel_norm_post_rowsum.feather + ``` + Args: + dir_p (pathlib.Path): The directory to check. 
+ """ + # Root Files + root_files = list(dir_p.glob("*.json")) + \ + list(dir_p.glob("*feather")) + \ + list(dir_p.glob("*csv")) + root_file_names = [f.stem for f in root_files] + assert set(self._example_pixel_output_dir_names["root_files"]) == set(root_file_names) + + # Pixel Mat Data + pixel_mat_files = list((dir_p / "pixel_mat_data").glob("*.feather")) + pixel_mat_files_names = [f.stem for f in pixel_mat_files] + assert set(self._example_pixel_output_dir_names["pixel_mat_data"]) \ + == set(pixel_mat_files_names) + + # Pixel Mat Subset + pixel_mat_subset_files = list((dir_p / "pixel_mat_subset").glob("*.feather")) + pixel_mat_subset_names = [f.stem for f in pixel_mat_subset_files] + assert set(self._example_pixel_output_dir_names["pixel_mat_subset"]) \ + == set(pixel_mat_subset_names) + + # Pixel Masks + pixel_mask_files = list((dir_p / "pixel_masks").glob("*.tiff")) + pixel_mask_names = [f.stem for f in pixel_mask_files] + assert set(self._example_pixel_output_dir_names["pixel_masks"]) \ + == set(pixel_mask_names) + + def _example_cell_output_dir_check(self, dir_p: pathlib.Path): + """ + Checks to make sure that the following files exist w.r.t the + `example_cell_output_dir`. + + ``` + example_cell_output_dir/ + ├── cell_masks/ + │ ├── fov0_cell_mask.tiff + │ └── fov1_cell_mask.tiff + ├── cell_meta_cluster_channel_avg.csv + ├── cell_meta_cluster_count_avgs.csv + ├── cell_meta_cluster_mapping.csv + ├── cell_som_cluster_channel_avg.csv + ├── cell_som_cluster_count_avgs.csv + ├── cell_som_weights.feather + ├── cluster_counts.feather + ├── cluster_counts_size_norm.feather + └── weighted_cell_channel.csv + ``` + + Args: + dir_p (pathlib.Path): The directory to check. + """ + + # Root Files + root_files = list(dir_p.glob("*.feather")) + list(dir_p.glob("*.csv")) + root_file_names = [f.stem for f in root_files] + assert set(self._example_cell_output_dir_names["root_files"]) == set(root_file_names) + + # Cell Masks + cell_mask_files = list((dir_p / "cell_masks").glob("*.tiff")) + cell_mask_names = [f.stem for f in cell_mask_files] + assert set(self._example_cell_output_dir_names["cell_masks"]) \ + == set(cell_mask_names) + + def _spatial_lda_output_dir_check(self, dir_p: pathlib.Path): + """ + Checks to make sure that the correct files exist w.r.t the `spatial_lda` output dir + `spatial_analysis/spatial_lda/preprocessed`. + + Args: + dir_p (pathlib.Path): The directory to check. + """ + downloaded_lda_preprocessed = list((dir_p / "preprocessed").glob("*.pkl")) + downloaded_lda_preprocessed_names = [f.stem for f in downloaded_lda_preprocessed] + assert set(self._spatial_analysis_lda_preprocessed_files) == set( + downloaded_lda_preprocessed_names) + + def _post_clustering_output_dir_check(self, dir_p: pathlib.Path): + """ + Checks to make sure that the correct files exist w.r.t the `post_clustering` output dir + + Args: + dir_p (pathlib.Path): The directory to check. + """ + downloaded_post_cluster = list(dir_p.glob("*.csv")) + downloaded_post_cluster_names = [f.stem for f in downloaded_post_cluster] + assert set(self._post_clustering_files) == set(downloaded_post_cluster_names) + + def _ome_tiff_check(self, dir_p: pathlib.Path): + """ + Checks to make sure that the correct files exist w.r.t the `ome_tiff` output dir + + Args: + dir_p (pathlib.Path): The directory to check. 
+ """ + downloaded_ome_tiff = list(dir_p.glob("*.ome.tiff")) + downloaded_ome_tiff_names = [f.stem for f in downloaded_ome_tiff] + assert set(self._ome_tiff_files) == set(downloaded_ome_tiff_names) + + def _ez_seg_data_check(self, dir_p: pathlib.Path): + """ + Checks to make sure that the correct files exist w.r.t the 'ez_seg_data' output dir + + Args: + dir_p (pathlib.Path): The directory to check. + """ + image_data = dir_p / "image_data" + composites = dir_p / "composites" + cell_tables = dir_p / "cell_table" + deepcell_output = dir_p / "segmentation" / "deepcell_output" + ez_masks = dir_p / "segmentation" / "ez_masks" + merged_masks = dir_p / "segmentation" / "merged_masks_dir" + final_masks = dir_p / "segmentation" / "final_mask_dir" + mantis_visualization = dir_p / "mantis_visualization" + logs = dir_p / "logs" + + # image_data check + downloaded_fovs = list(image_data.glob("*")) + downloaded_fov_names = [f.stem for f in downloaded_fovs] + assert set(self._ez_seg_files["fov_names"]) == set(downloaded_fov_names) + + for fov in downloaded_fovs: + c_names = [c.stem for c in fov.rglob("*")] + assert set(self._ez_seg_files["channel_names"]) == set(c_names) + + # composites check + downloaded_fovs = list(composites.glob("*")) + downloaded_fov_names = [f.stem for f in downloaded_fovs] + assert set(self._ez_seg_files["fov_names"]) == set(downloaded_fov_names) + + for fov in downloaded_fovs: + c_names = [c.stem for c in fov.rglob("*")] + assert set(self._ez_seg_files["composite_names"]) == set(c_names) + + # cell tables check + downloaded_cell_tables = list(cell_tables.glob("*.csv")) + downloaded_cell_table_names = [f.stem for f in downloaded_cell_tables] + assert set(self._ez_seg_files["cell_table_names"]) == set(downloaded_cell_table_names) + + # deepcell output check + downloaded_whole_cell_seg = list(deepcell_output.glob("*.tiff")) + downloaded_whole_cell_names = [f.stem for f in downloaded_whole_cell_seg] + actual_whole_cell_names = [f"{fov}_whole_cell" for fov in self._ez_seg_files["fov_names"]] + assert set(actual_whole_cell_names) == set(downloaded_whole_cell_names) + + # ezSegmenter masks check + downloaded_ez = list(ez_masks.glob("*.tiff")) + downloaded_ez_names = [f.stem for f in downloaded_ez] + actual_ez_names = [ + f"{fov}_{ez_suffix}" + for fov in self._ez_seg_files["fov_names"] + for ez_suffix in self._ez_seg_files["ez_mask_suffixes"] + ] + assert set(actual_ez_names) == set(downloaded_ez_names) + + # merged masks check + downloaded_merged = list(merged_masks.glob("*.tiff")) + downloaded_merged_names = [f.stem for f in downloaded_merged] + actual_merged_names = [ + f"{fov}_{merged_mask_suffix}" + for fov in self._ez_seg_files["fov_names"] + for merged_mask_suffix in self._ez_seg_files["merged_mask_suffixes"] + ] + assert set(actual_merged_names) == set(downloaded_merged_names) + + # final masks check + downloaded_final = list(final_masks.glob("*.tiff")) + downloaded_final_names = [f.stem for f in downloaded_final] + actual_final_names = [ + f"{fov}_{final_mask_suffix}" + for fov in self._ez_seg_files["fov_names"] + for final_mask_suffix in self._ez_seg_files["final_mask_suffixes"] + ] + assert set(actual_final_names) == set(downloaded_final_names) + + # logs check + downloaded_logs = list(logs.glob("*.txt")) + downloaded_log_names = [f.stem for f in downloaded_logs] + assert set(self._ez_seg_files["log_names"]) == set(downloaded_log_names) + + def _suffix_paths(self, dataset_download: ExampleDataset, + parent_dir: pathlib.Path) -> Generator: + """ + Creates a generator where 
each element is a tuple of the data directory + and the dataset name. + + Args: + dataset_download (ExampleDataset): Fixture for the dataset, respective to each + partition (`segment_image_data`, `cluster_pixels`, `cluster_cells`, + `post_clustering`). + parent_dir (pathlib.Path): The path where the example dataset will be saved. + + Yields: + Generator: Yields the data directory for the files to be moved, and the dataset name. + """ + dataset_names = list( + dataset_download.dataset_paths[dataset_download.dataset].keys() + ) + + ds_n_suffixes = [self.move_path_suffixes[ds_n] for ds_n in dataset_names] + for ds_n_suffix, ds_n in zip(ds_n_suffixes, dataset_names): + yield (parent_dir / ds_n_suffix, ds_n)
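
A minimal usage sketch of the new user-facing entry point added in `example_dataset.py`; the destination path below is illustrative, not a project default:

```python
from nimbus_inference.example_dataset import get_example_dataset

# Download the "segment_image_data" partition from Hugging Face and copy it into
# a local working directory ("data/example_dataset" is an illustrative path).
# Existing files in the destination are overwritten because overwrite_existing=True.
get_example_dataset(
    dataset="segment_image_data",
    save_dir="data/example_dataset",
    overwrite_existing=True,
)
```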
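The least obvious step in `ExampleDataset.download_example_dataset` is how it re-roots the absolute paths returned by Hugging Face onto the user's cache directory. A standalone sketch of that remapping (the username and extraction hash are made up):

```python
import pathlib

# Hugging Face returns absolute paths inside its own cache; the last three path
# components ("downloads/extracted/<hash>") are kept and re-rooted under cache_dir
# so the resulting path resolves on the user's machine.
cache_dir = pathlib.Path("~/.cache/huggingface/datasets").expanduser()
hf_path = "/Users/user/.cache/huggingface/datasets/downloads/extracted/abc123"
relative = pathlib.Path(*pathlib.Path(hf_path).parts[-3:])  # downloads/extracted/abc123
feature = "image_data"                                      # one feature per partition folder
local_path = cache_dir / relative / feature
print(local_path)  # ~/.cache/huggingface/datasets/downloads/extracted/abc123/image_data
```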
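When the default Hugging Face cache location is not appropriate (the CI branch of the `dataset_cache_dir` fixture in `test_example_dataset.py` is one such case), `ExampleDataset` can also be driven directly. A sketch under the assumption of a `/tmp` cache path, which is illustrative only:

```python
import pathlib
from nimbus_inference.example_dataset import ExampleDataset, EXAMPLE_DATASET_REVISION

# Equivalent to get_example_dataset(), but with an explicit cache directory.
# overwrite_existing=False warns instead of clobbering files already in move_dir.
ds = ExampleDataset(
    dataset="cluster_pixels",
    overwrite_existing=False,
    cache_dir=pathlib.Path("/tmp/nimbus_hf_cache"),  # hypothetical cache location
    revision=EXAMPLE_DATASET_REVISION,
)
ds.download_example_dataset()
ds.move_example_dataset(move_dir="data/example_dataset")
```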