From 23e64fedb03a171999c7c178739146b3ce2d1266 Mon Sep 17 00:00:00 2001
From: Alex Zwanenburg <alexander.zwanenburg@nct-dresden.de>
Date: Tue, 2 Apr 2024 17:26:34 +0200
Subject: [PATCH] Extended quick-start section

#69
---
 docs_source/source/quick_start.rst | 87 +++++++++++++++++++++++++++---
 test/documentation_example_test.py | 48 +++++++++++++++++
 2 files changed, 128 insertions(+), 7 deletions(-)

diff --git a/docs_source/source/quick_start.rst b/docs_source/source/quick_start.rst
index c683d6dd..9290dfa7 100644
--- a/docs_source/source/quick_start.rst
+++ b/docs_source/source/quick_start.rst
@@ -7,17 +7,20 @@ Before you begin, you need to:
 
 Computing quantitative features
 -------------------------------
-Suppose you have a dataset of computed tomography (CT) DICOM images with corresponding segmentations. Suppose that both
-images and masks are located split by patient directories ``path/to/data``. For each patient, the CT image is in the
-``image`` directory, and its corresponding segmentation in ``mask``. For patient ``patient_003``, the full path to the
+Suppose you have a dataset of computed tomography (CT) DICOM images with corresponding segmentation masks, from which
+you want to compute quantitative features. Now, suppose that both images and masks are separated by patient
+directories within a general ``path/to/data`` folder. For each patient, the CT image is in the ``image`` directory,
+and its corresponding segmentation in ``mask``. For patient ``patient_003``, the full path to the
 image directory is ``path/to/data/patient_003/image``, and to the mask directory is ``path/to/data/patient_003/mask``.
 
-We want to compute features from the gross tumour mask (called ``GTV``). We are interested in the soft-tissue range,
-with Hounsfield Units between -150 and 200 HU. To harmonise differences in resolution and slice distance
+We want to compute features from a pre-defined gross tumour mask (called ``GTV``). We are interested in the soft-tissue
+range, with Hounsfield Units between -150 and 200 HU. To harmonise differences in resolution and slice distance
 between CT images from different patients, all voxels are resampled to a 1.0 by 1.0 by 1.0 mm size. Histogram and
 texture features are computed after discretisation using the `fixed bin size` method with a bin size of 25 Hounsfield
 Units.
 
+MIRP can compute quantitative features using the function call below:
+
 .. code-block:: python
 
     import pandas as pd
@@ -35,8 +38,8 @@ Units.
         base_discretisation_bin_width=25.0
     )
 
-The above code results in ``feature_data``, a list of ``pandas.DataFrame`` that contains feature values for every
-patient. These can combined into a single ``pandas.DataFrame`` as follows:
+The above code results in ``feature_data`` which is a list of ``pandas.DataFrame`` that contains feature values for
+every patient. These can be combined into a single ``pandas.DataFrame`` as follows:
 
 .. code-block:: python
 
@@ -44,4 +47,74 @@ patient. These can combined into a single ``pandas.DataFrame`` as follows:
 
 Computing quantitative features from filtered images
 ----------------------------------------------------
+Image filters enhance aspects such as edges, blobs and directional structures. MIRP supports several filters (see
+:ref:`quantitative_image_analysis`). Suppose you want to use a Laplacian-of-Gaussian filter, with the width of the
+Gaussian equal to 2.0 mm.
+
+We can first inspect the images visually using ``extract_images``. By default, ``extract_images`` exports images and
+masks as a dictionary with ``numpy`` data and metadata (or as NIfTI files, in case ``write_dir`` is provided). However,
+MIRP has a simple viewer for its own internal format. To use this viewer, you can set ``image_export_format =
+"native"``.
+
+.. code-block:: python
+
+    from mirp import extract_images
+
+    images = extract_images(
+        image="path/to/data",
+        mask="path/to/data",
+        image_sub_folder="image",
+        mask_sub_folder="mask",
+        roi_name="GTV",
+        new_spacing=1.0,
+        resegmentation_intensity_range=[-150.0, 200.0],
+        filter_kernels="laplacian_of_gaussian",
+        laplacian_of_gaussian_sigma=2.0,
+        image_export_format="native"
+    )
+
+Here, ``images`` is a list of images and masks, with one entry for each patient. Each entry consists of two nested
+lists, one for images and one for masks. In this case, the nested list of images contains two entries, and that of masks
+only one (for the ``GTV`` region of interest). The first image is the CT image, after interpolation to 1.0 by 1.0 by
+1.0 mm voxels. The second image is the Laplacian-of-Gaussian filtered image. View each image with its ``show`` method:
+
+.. code-block:: python
+
+    patient_1_images, patient_1_mask = images[0]
+    patient_1_ct_image, patient_1_log_image = patient_1_images
+
+    # View the CT image
+    patient_1_ct_image.show()
+
+    # View the Laplacian-of-Gaussian filtered image
+    patient_1_log_image.show()
+
+Of course, features can also be computed from filtered images (also called response maps). By default, only
+statistical features [Zwanenburg2016]_ are computed from filtered images.
+
+.. code-block:: python
+
+    import pandas as pd
+    from mirp import extract_features
+
+    feature_data = extract_features(
+        image="path/to/data",
+        mask="path/to/data",
+        image_sub_folder="image",
+        mask_sub_folder="mask",
+        roi_name="GTV",
+        new_spacing=1.0,
+        resegmentation_intensity_range=[-150.0, 200.0],
+        base_discretisation_method="fixed_bin_size",
+        base_discretisation_bin_width=25.0,
+        filter_kernels="laplacian_of_gaussian",
+        laplacian_of_gaussian_sigma=2.0
+    )
+
+    feature_data = pd.concat(feature_data)
+
 
+References
+----------
+.. [Zwanenburg2016] Zwanenburg A, Leger S, Vallieres M, Loeck S. Image biomarker standardisation initiative. arXiv
+  [cs.CV] 2016. doi:10.48550/arXiv.1612.07003
\ No newline at end of file
diff --git a/test/documentation_example_test.py b/test/documentation_example_test.py
index bf2b5fb6..52c5d4da 100644
--- a/test/documentation_example_test.py
+++ b/test/documentation_example_test.py
@@ -6,6 +6,8 @@
 
 
 def test_quick_start():
+
+    # Quick-start example 1 (extract features)
     from mirp import extract_features
 
     feature_data = extract_features(
@@ -24,6 +26,52 @@ def test_quick_start():
 
     assert len(feature_data) == 3
 
+    # Quick start example 2 (view filtered images)
+    from mirp._images.ct_image import CTImage
+    from mirp._images.transformed_image import LaplacianOfGaussianTransformedImage
+    from mirp import extract_images
+
+    images = extract_images(
+        image=os.path.join(CURRENT_DIR, "data", "sts_images"),
+        mask=os.path.join(CURRENT_DIR, "data", "sts_images"),
+        image_sub_folder=os.path.join("CT", "dicom", "image"),
+        mask_sub_folder=os.path.join("CT", "dicom", "mask"),
+        roi_name="GTV_Mass_CT",
+        new_spacing=1.0,
+        resegmentation_intensity_range=[-150.0, 200.0],
+        filter_kernels="laplacian_of_gaussian",
+        laplacian_of_gaussian_sigma=2.0,
+        image_export_format="native"
+    )
+
+    patient_1_images, patient_1_mask = images[0]
+    patient_1_ct_image, patient_1_log_image = patient_1_images
+
+    assert len(images) == 3
+    assert isinstance(patient_1_ct_image, CTImage)
+    assert isinstance(patient_1_log_image, LaplacianOfGaussianTransformedImage)
+
+    # Quick start example 3 (features from filtered images).
+    from mirp import extract_features
+
+    feature_data = extract_features(
+        image=os.path.join(CURRENT_DIR, "data", "sts_images"),
+        mask=os.path.join(CURRENT_DIR, "data", "sts_images"),
+        image_sub_folder=os.path.join("CT", "dicom", "image"),
+        mask_sub_folder=os.path.join("CT", "dicom", "mask"),
+        roi_name="GTV_Mass_CT",
+        new_spacing=1.0,
+        resegmentation_intensity_range=[-150.0, 200.0],
+        base_discretisation_method="fixed_bin_size",
+        base_discretisation_bin_width=25.0,
+        filter_kernels="laplacian_of_gaussian",
+        laplacian_of_gaussian_sigma=2.0
+    )
+
+    feature_data = pd.concat(feature_data)
+
+    assert len(feature_data) == 3
+
 
 def test_extract_features_examples():
     from mirp import extract_features