From 442f6a9883e3e656e41cdaa2147f0dba914ee2e9 Mon Sep 17 00:00:00 2001 From: kodda Date: Wed, 17 Mar 2021 18:20:03 +0100 Subject: [PATCH 1/5] binary segment --- docs/Scanner/explanations/segmentation.md | 63 +++++++---------------- 1 file changed, 18 insertions(+), 45 deletions(-) diff --git a/docs/Scanner/explanations/segmentation.md b/docs/Scanner/explanations/segmentation.md index ee844298..8302ce1e 100644 --- a/docs/Scanner/explanations/segmentation.md +++ b/docs/Scanner/explanations/segmentation.md @@ -53,10 +53,10 @@ the weights can then be retrieved as *clf.coef_* and the threshold as *-clf.inte upstream_task = "ImagesFilesetExists" # other option "Undistorted" type = "linear" parameters = "[0,1,0]" -threshold = 0.5 -#Optional arguments dilation = 0 -query = "{\"channel\":\"rgb\"}" #This is optional, necessary when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) +binarize = true +threshold = 0.5 +query = "{\"channel\":\"rgb\"}" #This is optional, useful when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) ``` @@ -88,66 +88,39 @@ type = "excess_green" dilation = 0 binarize = true threshold = 0.2 -query = "{\"channel\":\"rgb\"}" #This is optional, necessary when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) +query = "{\"channel\":\"rgb\"}" #This is optional, useful when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) ``` -### Inversion - -For an index I, if you want to use $1-I$ for creating the mask, set *invert* to *True*. - -##Multi-class segmentation +#### Vesselness -The *Segmentation2D* task performs the semantic segmentation of images using a deep neural network (DNN). The command to run this task is: +!!! danger + BROKEN the task calls the function vesselness with a *channel* argument which is not in the definition of the vesselness function. It should be repaired or removed -```bash -romi_run_task Segmentation2D scan_id my_config.toml -``` -This will produce a series of binary masks, one for each class on which the network was trained. +The two previous methods wre based only on color. Instead, here, we consider differential information by relying on the Hessian matrix. The vesselness index is computed according to the method described in [mevislab](https://mevislabdownloads.mevis.de/docs/current/FMEstable/ReleaseMeVis/Documentation/Publish/ModuleReference/Vesselness.html). -
-U-net architecture -
Generic encoder/decoder architecture for semantic segmentation (U-net).
-
-The architecture of the network is inspired from the U-net [ref], with a ResNet encoder [ref]. It constists in encoding and decoding pathways with skip connections between the 2. +### Binarization -####Configuration File - -```toml -[Segmentation2D] -upstream_task = "ImageFilesetExists" #Alternatively Undistorted -model_fileset = "ModelFileset" -model_id = "Resnet_896_896_epoch50" # no default value -query = "{\"channel\":\"rgb\"}" # default is an empty dict '{}' -Sx = 896 -Sy = 896 -labels = "[]" # default is empty list to use all trained labels from model -inverted_labels = "[\"background\"]" -threshold = 0.01 -``` - - -### DNN model - -The neural architecture weights are obtained through training on an annotated dataset (see How to train a DNN for semantic segmentation). Those weights should be stored in the database (at `/models/models`) and the name of the weights file should be provided as the *model_id* parameter in the configuration. You can use our model trained on virtual arabidopsis [here](https://media.romi-project.eu/data/Resnetdataset_gl_png_896_896_epoch50.pt) - -## Binarization - -A binary mask $m$ is produced from the index or from the output of the DNN, *I*, by applying a threshold $\theta$ on I for each pixel $(i,j)$: +If the *binarize* parameter is set to *True*, a binary mask $m$ is produced from the index *I* by applying a threshold $\theta$ on I for each pixel $(i,j)$: \begin{equation} m_{ij} = \begin{cases} - 255 & \text{if $I_{ij}>\theta$}\\ + 1 & \text{if $I_{ij}>\theta$}\\ 0 & \text{otherwise} \end{cases} \end{equation} - -## Dilation +### Dilation If the integer *dilation* parameter is non-zero a morphological dilation is apllied to the image using the function [*binary_dilation*](https://scikit-image.org/docs/dev/api/skimage.morphology.html#skimage.morphology.binary_dilation) from the *skimage.morphology* module. The *dilation* parameter sets the number of times *binary_dilation* is iteratively applied. For a faithful reconstruction this parameter should be set to $0$ but in practice you may want to have a coarser point cloud. This is true when your segmentation is not perfect, dilation will fill the holes or when the reconstructed mesh is broken because the pôint cloud is too thin. +### Inversion + +For an index I, if you want to use $1-I$, set *invert* to *True*. + + +##Multi-class segmentation \ No newline at end of file From addd553d9743f2546a306bb3489e4ac3027a45b9 Mon Sep 17 00:00:00 2001 From: kodda Date: Thu, 18 Mar 2021 11:47:00 +0100 Subject: [PATCH 2/5] multi-class segmentation --- docs/Scanner/explanations/segmentation.md | 63 ++++++++++++++++------- 1 file changed, 45 insertions(+), 18 deletions(-) diff --git a/docs/Scanner/explanations/segmentation.md b/docs/Scanner/explanations/segmentation.md index 8302ce1e..ee844298 100644 --- a/docs/Scanner/explanations/segmentation.md +++ b/docs/Scanner/explanations/segmentation.md @@ -53,10 +53,10 @@ the weights can then be retrieved as *clf.coef_* and the threshold as *-clf.inte upstream_task = "ImagesFilesetExists" # other option "Undistorted" type = "linear" parameters = "[0,1,0]" -dilation = 0 -binarize = true threshold = 0.5 -query = "{\"channel\":\"rgb\"}" #This is optional, useful when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) +#Optional arguments +dilation = 0 +query = "{\"channel\":\"rgb\"}" #This is optional, necessary when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) ``` @@ -88,39 +88,66 @@ type = "excess_green" dilation = 0 binarize = true threshold = 0.2 -query = "{\"channel\":\"rgb\"}" #This is optional, useful when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) +query = "{\"channel\":\"rgb\"}" #This is optional, necessary when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) ``` +### Inversion + +For an index I, if you want to use $1-I$ for creating the mask, set *invert* to *True*. + -#### Vesselness +##Multi-class segmentation -!!! danger - BROKEN the task calls the function vesselness with a *channel* argument which is not in the definition of the vesselness function. It should be repaired or removed +The *Segmentation2D* task performs the semantic segmentation of images using a deep neural network (DNN). The command to run this task is: -The two previous methods wre based only on color. Instead, here, we consider differential information by relying on the Hessian matrix. The vesselness index is computed according to the method described in [mevislab](https://mevislabdownloads.mevis.de/docs/current/FMEstable/ReleaseMeVis/Documentation/Publish/ModuleReference/Vesselness.html). +```bash +romi_run_task Segmentation2D scan_id my_config.toml +``` +This will produce a series of binary masks, one for each class on which the network was trained. +
+U-net architecture +
Generic encoder/decoder architecture for semantic segmentation (U-net).
+
-### Binarization +The architecture of the network is inspired from the U-net [ref], with a ResNet encoder [ref]. It constists in encoding and decoding pathways with skip connections between the 2. -If the *binarize* parameter is set to *True*, a binary mask $m$ is produced from the index *I* by applying a threshold $\theta$ on I for each pixel $(i,j)$: +####Configuration File + +```toml +[Segmentation2D] +upstream_task = "ImageFilesetExists" #Alternatively Undistorted +model_fileset = "ModelFileset" +model_id = "Resnet_896_896_epoch50" # no default value +query = "{\"channel\":\"rgb\"}" # default is an empty dict '{}' +Sx = 896 +Sy = 896 +labels = "[]" # default is empty list to use all trained labels from model +inverted_labels = "[\"background\"]" +threshold = 0.01 +``` + + +### DNN model + +The neural architecture weights are obtained through training on an annotated dataset (see How to train a DNN for semantic segmentation). Those weights should be stored in the database (at `/models/models`) and the name of the weights file should be provided as the *model_id* parameter in the configuration. You can use our model trained on virtual arabidopsis [here](https://media.romi-project.eu/data/Resnetdataset_gl_png_896_896_epoch50.pt) + +## Binarization + +A binary mask $m$ is produced from the index or from the output of the DNN, *I*, by applying a threshold $\theta$ on I for each pixel $(i,j)$: \begin{equation} m_{ij} = \begin{cases} - 1 & \text{if $I_{ij}>\theta$}\\ + 255 & \text{if $I_{ij}>\theta$}\\ 0 & \text{otherwise} \end{cases} \end{equation} -### Dilation + +## Dilation If the integer *dilation* parameter is non-zero a morphological dilation is apllied to the image using the function [*binary_dilation*](https://scikit-image.org/docs/dev/api/skimage.morphology.html#skimage.morphology.binary_dilation) from the *skimage.morphology* module. The *dilation* parameter sets the number of times *binary_dilation* is iteratively applied. For a faithful reconstruction this parameter should be set to $0$ but in practice you may want to have a coarser point cloud. This is true when your segmentation is not perfect, dilation will fill the holes or when the reconstructed mesh is broken because the pôint cloud is too thin. -### Inversion - -For an index I, if you want to use $1-I$, set *invert* to *True*. - - -##Multi-class segmentation \ No newline at end of file From fabc9f0781df9d01a5b24ee3af478f005ee1454a Mon Sep 17 00:00:00 2001 From: kodda Date: Fri, 19 Mar 2021 16:26:27 +0100 Subject: [PATCH 3/5] completed segmentation doc --- docs/Scanner/explanations/segmentation.md | 35 ++++++++++++----------- 1 file changed, 19 insertions(+), 16 deletions(-) diff --git a/docs/Scanner/explanations/segmentation.md b/docs/Scanner/explanations/segmentation.md index ee844298..05241119 100644 --- a/docs/Scanner/explanations/segmentation.md +++ b/docs/Scanner/explanations/segmentation.md @@ -54,8 +54,7 @@ upstream_task = "ImagesFilesetExists" # other option "Undistorted" type = "linear" parameters = "[0,1,0]" threshold = 0.5 -#Optional arguments -dilation = 0 +#Optional parameters query = "{\"channel\":\"rgb\"}" #This is optional, necessary when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) ``` @@ -86,16 +85,10 @@ $$ upstream_task = "ImagesFilesetExists" # other option "Undistorted" type = "excess_green" dilation = 0 -binarize = true threshold = 0.2 query = "{\"channel\":\"rgb\"}" #This is optional, necessary when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) ``` -### Inversion - -For an index I, if you want to use $1-I$ for creating the mask, set *invert* to *True*. - - ##Multi-class segmentation The *Segmentation2D* task performs the semantic segmentation of images using a deep neural network (DNN). The command to run this task is: @@ -110,24 +103,22 @@ This will produce a series of binary masks, one for each class on which the netw
Generic encoder/decoder architecture for semantic segmentation (U-net).
-The architecture of the network is inspired from the U-net [ref], with a ResNet encoder [ref]. It constists in encoding and decoding pathways with skip connections between the 2. +The architecture of the network is inspired from the U-net [^1], with a ResNet encoder [^2]. It constists in encoding and decoding pathways with skip connections between the 2. The network is trained for segmenting images of a size $(S_x,S_y)$ which is not necessarily the image size of the acquired images. Those parameters *Sx* and *Sy* should be provided in the configuration file. The images will be cropped to $(S_x,S_y)$ before being fed to the DNN and it is then resized to the original size as an output of the task. + +[^1]: Ronneberger, O., Fischer, P., & Brox, T. (2015, October). U-net: Convolutional networks for biomedical image segmentation. In International Conference on Medical image computing and computer-assisted intervention (pp. 234-241). Springer, Cham. + +[^2]: Zhang, Z., Liu, Q., & Wang, Y. (2018). Road extraction by deep residual u-net. IEEE Geoscience and Remote Sensing Letters, 15(5), 749-753. ####Configuration File ```toml [Segmentation2D] -upstream_task = "ImageFilesetExists" #Alternatively Undistorted -model_fileset = "ModelFileset" model_id = "Resnet_896_896_epoch50" # no default value -query = "{\"channel\":\"rgb\"}" # default is an empty dict '{}' Sx = 896 Sy = 896 -labels = "[]" # default is empty list to use all trained labels from model -inverted_labels = "[\"background\"]" threshold = 0.01 ``` - ### DNN model The neural architecture weights are obtained through training on an annotated dataset (see How to train a DNN for semantic segmentation). Those weights should be stored in the database (at `/models/models`) and the name of the weights file should be provided as the *model_id* parameter in the configuration. You can use our model trained on virtual arabidopsis [here](https://media.romi-project.eu/data/Resnetdataset_gl_png_896_896_epoch50.pt) @@ -144,10 +135,22 @@ A binary mask $m$ is produced from the index or from the output of the DNN, *I*, \end{cases} \end{equation} +This threshold may be chosen empirically or it may be learnt from annotated data (see linear SVM section). ## Dilation -If the integer *dilation* parameter is non-zero a morphological dilation is apllied to the image using the function [*binary_dilation*](https://scikit-image.org/docs/dev/api/skimage.morphology.html#skimage.morphology.binary_dilation) from the *skimage.morphology* module. +If the integer *dilation* parameter is non-zero a morphological dilation is apllied to the image using the function [*binary_dilation*](https://scikit-image.org/docs/dev/api/skimage.morphology.html#skimage.morphology.binary_dilation) from the *skimage.morphology* module. The *dilation* parameter sets the number of times *binary_dilation* is iteratively applied. For a faithful reconstruction this parameter should be set to $0$ but in practice you may want to have a coarser point cloud. This is true when your segmentation is not perfect, dilation will fill the holes or when the reconstructed mesh is broken because the pôint cloud is too thin. +## Working with data from the virtual scanner + +When working with data generated with the virtual scanner, the *images* folder contains multiple channels corresponding to the various class for which images were generated (*stem*, *flower*, *fruit*, *leaf*, *pedicel*). You have to select the *rgb* channel using the *query* parameter. + +####Configuration File +```toml +[Masks] +type = "excess_green" +threshold = 0.2 +query = "{\"channel\":\"rgb\"}" +``` From ce0593c3e813d0f1148cb09c2516673f7dedbbd8 Mon Sep 17 00:00:00 2001 From: kodda Date: Fri, 19 Mar 2021 16:34:22 +0100 Subject: [PATCH 4/5] completed segmentation doc --- docs/Scanner/explanations/segmentation.md | 14 ++++++-------- 1 file changed, 6 insertions(+), 8 deletions(-) diff --git a/docs/Scanner/explanations/segmentation.md b/docs/Scanner/explanations/segmentation.md index 05241119..e2e341d2 100644 --- a/docs/Scanner/explanations/segmentation.md +++ b/docs/Scanner/explanations/segmentation.md @@ -1,7 +1,7 @@ Segmentation of images === -The segmentation of an image consists in assigning a label to each of its pixels. For the 3d reconstruction of a plant, we need at least the segmentation of the images into 2 classes: *plant* and *backround*. For a reconstruction with semantic labeling of the point cloud, we will need a semantic segmentation of the images giving one label for each organ type (e.g. {*leaf*, *stem*,*pedicel*, *flower*, *fruit*}). Figures shows describe the binary and multi-class segmentations for a virtual plant. +The segmentation of an image consists in assigning a label to each of its pixels. For the 3d reconstruction of a plant, we need at least the segmentation of the images into 2 classes: *plant* and *backround*. For a reconstruction with semantic labeling of the point cloud, we will need a semantic segmentation of the images giving one label for each organ type (e.g. {*leaf*, *stem*,*pedicel*, *flower*, *fruit*}). The figure below shows the binary and multi-class segmentations for a virtual plant.
Binary and multi-class segmentation examples @@ -16,9 +16,9 @@ The binary segmentation of an image into *plant* and *background* is performed w ```bash romi_run_task Masks scan_id --config myconfig.toml ``` -with upstream task being *ImagesFilesetExists* when processing the raw RGB images or *Undistorded* when processing images corrected using the intrinsic parameters of the camera. The task takes this set of images as an input and produce either binary mask or real valued maps depending on parameters. +with upstream task being *ImagesFilesetExists* when processing the raw RGB images or *Undistorded* when processing images corrected using the intrinsic parameters of the camera. The task takes this set of images as an input and produce one binary mask for each image. -There are 3 methods available to compute indices for binary segmentation: Excess Green Index, Linear SVM or Vesselness. For each method, we provide an example configuration file in the *Index computation* section. +There are 2 methods available to compute indices for binary segmentation: Excess Green Index and Linear SVM. For each method, we provide an example configuration file in the *Index computation* section. ### Index computation @@ -31,11 +31,11 @@ $$ S_{ij}=w_0 R_{ij} + w_1 G_{ij} +w_2 B_{ij} $$ -where $w$ is the *parameter* vector specified in the configuration file. A simple vector, like $w=(0,1,0)$ may be used. +where $w$ is the *parameters* vector specified in the configuration file. A simple vector, like $w=(0,1,0)$ may be used for example. -Alternatively you can train an SVM to learn those weights and the threshold to be provided in the configuration file. For this, we consider you have a sample image and a ground truth binary mask. A ground may be produced using a manual annotation tool like [LabelMe](https://github.com/wkentaro/labelme). +Alternatively, you can train an SVM to learn those weights and the threshold to be provided in the configuration file. For this, we consider you have a sample image and a ground truth binary mask. A ground truth may be produced using a manual annotation tool like [LabelMe](https://github.com/wkentaro/labelme). -Using for example a list of 1000 randomly selected pixels as $X_{train}$ and their corresponding labels as $Y_{train}$, a linear SVM is trained using +Using for example a list of N randomly selected pixels as $X_{train}$ (array of size [N,3]) and their corresponding labels as $Y_{train}$ (array of size N), a linear SVM is trained using ```python from sklearn import svm @@ -54,8 +54,6 @@ upstream_task = "ImagesFilesetExists" # other option "Undistorted" type = "linear" parameters = "[0,1,0]" threshold = 0.5 -#Optional parameters -query = "{\"channel\":\"rgb\"}" #This is optional, necessary when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) ``` From 9dec9c558754f5810580b488d9dd5595eb6136a6 Mon Sep 17 00:00:00 2001 From: kodda Date: Fri, 19 Mar 2021 16:42:48 +0100 Subject: [PATCH 5/5] completed segmentation doc 2 --- docs/Scanner/explanations/segmentation.md | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/docs/Scanner/explanations/segmentation.md b/docs/Scanner/explanations/segmentation.md index e2e341d2..e5e7df86 100644 --- a/docs/Scanner/explanations/segmentation.md +++ b/docs/Scanner/explanations/segmentation.md @@ -82,9 +82,7 @@ $$ [Masks] upstream_task = "ImagesFilesetExists" # other option "Undistorted" type = "excess_green" -dilation = 0 threshold = 0.2 -query = "{\"channel\":\"rgb\"}" #This is optional, necessary when the *ImageFileset* contains multiple channels (typically when it is produced from a virtual scan) ``` ##Multi-class segmentation @@ -101,7 +99,9 @@ This will produce a series of binary masks, one for each class on which the netw
Generic encoder/decoder architecture for semantic segmentation (U-net).
-The architecture of the network is inspired from the U-net [^1], with a ResNet encoder [^2]. It constists in encoding and decoding pathways with skip connections between the 2. The network is trained for segmenting images of a size $(S_x,S_y)$ which is not necessarily the image size of the acquired images. Those parameters *Sx* and *Sy* should be provided in the configuration file. The images will be cropped to $(S_x,S_y)$ before being fed to the DNN and it is then resized to the original size as an output of the task. +The architecture of the network is inspired from the U-net [^1], with a ResNet encoder [^2]. It constists in encoding and decoding pathways with skip connections between the 2. Along the encoding pathways, there is a sequence of convolutions and the image signal is upsampled along the decoding pathway. + +The network is trained for segmenting images of a size $(S_x,S_y)$ which is not necessarily the image size of the acquired images. Those parameters *Sx* and *Sy* should be provided in the configuration file. The images will be cropped to $(S_x,S_y)$ before being fed to the DNN and it is then resized to the original size as an output of the task. [^1]: Ronneberger, O., Fischer, P., & Brox, T. (2015, October). U-net: Convolutional networks for biomedical image segmentation. In International Conference on Medical image computing and computer-assisted intervention (pp. 234-241). Springer, Cham. @@ -111,7 +111,7 @@ The architecture of the network is inspired from the U-net [^1], with a ResNet e ```toml [Segmentation2D] -model_id = "Resnet_896_896_epoch50" # no default value +model_id = "Resnetdataset_gl_png_896_896_epoch50" # no default value Sx = 896 Sy = 896 threshold = 0.01