SOMExample.cxxΒΆ
Example usage:
./SOMExample Input/ROI_QB_MUL_1.png Output/ROI_QB_MUL_SOM.png Output/ROI_QB_MUL_SOMACT.png 4 4 4 4 20 1.0 0.1 128
Example source code (SOMExample.cxx):
/*
* Copyright (C) 2005-2019 Centre National d'Etudes Spatiales (CNES)
* Copyright (C) 2007-2012 Institut Mines Telecom / Telecom Bretagne
*
* This file is part of Orfeo Toolbox
*
* https://www.orfeo-toolbox.org/
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
// This example illustrates the use of the
// \doxygen{otb}{SOM} class for building Kohonen's Self Organizing
// Maps.
//
// We will use the SOM in order to build a color table from an input
// image. Our input image is coded with $3\times 8$ bits and we would
// like to code it with only 16 levels. We will use the SOM in order
// to learn which are the 16 most representative RGB values of the
// input image and we will assume that this is the optimal color table
// for the image.
//
// The first thing to do is include the header file for the
// class. We will also need the header files for the map itself and
// the activation map builder whose utility will be explained at the
// end of the example.
//
#include "otbSOMMap.h"
#include "otbSOM.h"
#include "otbSOMActivationBuilder.h"
#include "itkMacro.h"
#include "itkVectorExpandImageFilter.h"
#include "itkVectorNearestNeighborInterpolateImageFunction.h"
#include "itkExpandImageFilter.h"
#include "itkNearestNeighborInterpolateImageFunction.h"
#include "otbPerBandVectorImageFilter.h"
#include "otbPrintableImageFilter.h"
// Since the \doxygen{otb}{SOM} class uses a distance, we will need to
// include the header file for the one we want to use
//
#include "otbImageFileReader.h"
#include "otbImageFileWriter.h"
#include "itkListSample.h"
int main(int itkNotUsed(argc), char* argv[])
{
const char* inputFileName = argv[1];
const char* outputFileName = argv[2];
const char* actMapFileName = argv[3];
unsigned int sizeX = atoi(argv[4]);
unsigned int sizeY = atoi(argv[5]);
unsigned int neighInitX = atoi(argv[6]);
unsigned int neighInitY = atoi(argv[7]);
unsigned int nbIterations = atoi(argv[8]);
double betaInit = atof(argv[9]);
double betaEnd = atof(argv[10]);
double initValue = atof(argv[11]);
// The Self Organizing Map itself is actually an N-dimensional image
// where each pixel contains a neuron. In our case, we decide to build
// a 2-dimensional SOM, where the neurons store RGB values with
// floating point precision.
const unsigned int Dimension = 2;
using PixelType = double;
using ImageType = otb::VectorImage<PixelType, Dimension>;
using VectorType = ImageType::PixelType;
// The distance that we want to apply between the RGB values is the
// Euclidean one. Of course we could choose to use other type of
// distance, as for instance, a distance defined in any other color space.
using DistanceType = itk::Statistics::EuclideanDistanceMetric<VectorType>;
//
// We can now define the type for the map. The \doxygen{otb}{SOMMap}
// class is templated over the neuron type -- \code{PixelType} here
// --, the distance type and the number of dimensions. Note that the
// number of dimensions of the map could be different from the one of
// the images to be processed.
using MapType = otb::SOMMap<VectorType, DistanceType, Dimension>;
//
// We are going to perform the learning directly on the pixels of the
// input image. Therefore, the image type is defined using the same
// pixel type as we used for the map. We also define the type for the
// imge file reader.
using ReaderType = otb::ImageFileReader<ImageType>;
//
// Since the \doxygen{otb}{SOM} class works on lists of samples, it
// will need to access the input image through an adaptor. Its type is
// defined as follows:
using SampleListType = itk::Statistics::ListSample<VectorType>;
//
// We can now define the type for the SOM, which is templated over the
// input sample list and the type of the map to be produced and the two
// functors that hold the training behavior.
using LearningBehaviorFunctorType = otb::Functor::CzihoSOMLearningBehaviorFunctor;
using NeighborhoodBehaviorFunctorType = otb::Functor::CzihoSOMNeighborhoodBehaviorFunctor;
using SOMType = otb::SOM<SampleListType, MapType, LearningBehaviorFunctorType, NeighborhoodBehaviorFunctorType>;
//
// As an alternative to standard \code{SOMType}, one can decide to use
// an \doxygen{otb}{PeriodicSOM}, which behaves like \doxygen{otb}{SOM} but
// is to be considered to as a torus instead of a simple map. Hence, the
// neighborhood behavior of the winning neuron does not depend on its location
// on the map...
// \doxygen{otb}{PeriodicSOM} is defined in otbPeriodicSOM.h.
//
// We can now start building the pipeline. The first step is to
// instantiate the reader and pass its output to the adaptor.
ReaderType::Pointer reader = ReaderType::New();
reader->SetFileName(inputFileName);
reader->Update();
SampleListType::Pointer sampleList = SampleListType::New();
sampleList->SetMeasurementVectorSize(reader->GetOutput()->GetVectorLength());
itk::ImageRegionIterator<ImageType> imgIter(reader->GetOutput(), reader->GetOutput()->GetBufferedRegion());
imgIter.GoToBegin();
itk::ImageRegionIterator<ImageType> imgIterEnd(reader->GetOutput(), reader->GetOutput()->GetBufferedRegion());
imgIterEnd.GoToEnd();
do
{
sampleList->PushBack(imgIter.Get());
++imgIter;
} while (imgIter != imgIterEnd);
//
// We can now instantiate the SOM algorithm and set the sample list as input.
SOMType::Pointer som = SOMType::New();
som->SetListSample(sampleList);
//
// We use a \code{SOMType::SizeType} array in order to set the sizes
// of the map.
SOMType::SizeType size;
size[0] = sizeX;
size[1] = sizeY;
som->SetMapSize(size);
//
// The initial size of the neighborhood of each neuron is set in the
// same way.
SOMType::SizeType radius;
radius[0] = neighInitX;
radius[1] = neighInitY;
som->SetNeighborhoodSizeInit(radius);
//
// The other parameters are the number of iterations, the initial and
// the final values for the learning rate -- $\beta$ -- and the
// maximum initial value for the neurons (the map will be randomly
// initialized).
som->SetNumberOfIterations(nbIterations);
som->SetBetaInit(betaInit);
som->SetBetaEnd(betaEnd);
som->SetMaxWeight(static_cast<PixelType>(initValue));
//
// Now comes the initialization of the functors.
LearningBehaviorFunctorType learningFunctor;
learningFunctor.SetIterationThreshold(radius, nbIterations);
som->SetBetaFunctor(learningFunctor);
NeighborhoodBehaviorFunctorType neighborFunctor;
som->SetNeighborhoodSizeFunctor(neighborFunctor);
som->Update();
//
// Finally, we set up the las part of the pipeline where the plug the
// output of the SOM into the writer. The learning procedure is
// triggered by calling the \code{Update()} method on the writer.
// Since the map is itself an image, we can write it to disk with an
// \doxygen{otb}{ImageFileWriter}.
// Just for visualization purposes, we zoom the image, and pass it to the printable image filter
using SingleImageType = otb::Image<PixelType, 2>;
using ExpandType = itk::ExpandImageFilter<SingleImageType, SingleImageType>;
using VectorExpandType = otb::PerBandVectorImageFilter<MapType, MapType, ExpandType>;
using InterpolatorType = itk::NearestNeighborInterpolateImageFunction<SingleImageType, double>;
using PrintableFilterType = otb::PrintableImageFilter<MapType>;
using PrintableWriterType = otb::ImageFileWriter<PrintableFilterType::OutputImageType>;
InterpolatorType::Pointer interpolator = InterpolatorType::New();
VectorExpandType::Pointer expand = VectorExpandType::New();
ExpandType::Pointer scalarExpand = ExpandType::New();
scalarExpand->SetExpandFactors(40);
scalarExpand->SetInterpolator(interpolator);
// scalarExpand->SetEdgePaddingValue(255);
expand->SetFilter(scalarExpand);
expand->SetInput(som->GetOutput());
expand->UpdateOutputInformation();
PrintableFilterType::Pointer printFilter = PrintableFilterType::New();
printFilter->SetInput(expand->GetOutput());
printFilter->SetChannel(1);
printFilter->SetChannel(2);
printFilter->SetChannel(3);
PrintableWriterType::Pointer printWriter = PrintableWriterType::New();
printWriter->SetInput(printFilter->GetOutput());
printWriter->SetFileName(outputFileName);
printWriter->Update();
// Figure \ref{fig:SOMMAP} shows the result of the SOM learning. Since
// we have performed a learning on RGB pixel values, the produced SOM
// can be interpreted as an optimal color table for the input
// image. It can be observed that the obtained colors are
// topologically organised, so similar colors are also close in the
// map. This topological organisation can be exploited to further
// reduce the number of coding levels of the pixels without
// performing a new learning: we can subsample the map to get a new
// color table. Also, a bilinear interpolation between the neurons can
// be used to increase the number of coding levels.
// \begin{figure}
// \center
// \includegraphics[width=0.45\textwidth]{ROI_QB_MUL_1.eps}
// \includegraphics[width=0.2\textwidth]{ROI_QB_MUL_SOM.eps}
// \includegraphics[width=0.2\textwidth]{ROI_QB_MUL_SOMACT.eps}
// \itkcaption[SOM Image Classification]{Result of the SOM
// learning. Left: RGB image. Center: SOM. Right: Activation map}
// \label{fig:SOMMAP}
// \end{figure}
// We can now compute the activation map for the input image. The
// activation map tells us how many times a given neuron is activated
// for the set of examples given to the map. The activation map is
// stored as a scalar image and an integer pixel type is usually enough.
using OutputPixelType = unsigned char;
using OutputImageType = otb::Image<OutputPixelType, Dimension>;
using ActivationWriterType = otb::ImageFileWriter<OutputImageType>;
// In a similar way to the \doxygen{otb}{SOM} class the
// \doxygen{otb}{SOMActivationBuilder} is templated over the sample
// list given as input, the SOM map type and the activation map to be
// built as output.
using SOMActivationBuilderType = otb::SOMActivationBuilder<SampleListType, MapType, OutputImageType>;
// We instantiate the activation map builder and set as input the SOM
// map build before and the image (using the adaptor).
SOMActivationBuilderType::Pointer somAct = SOMActivationBuilderType::New();
somAct->SetInput(som->GetOutput());
somAct->SetListSample(sampleList);
somAct->Update();
// The final step is to write the activation map to a file.
if (actMapFileName != nullptr)
{
ActivationWriterType::Pointer actWriter = ActivationWriterType::New();
actWriter->SetFileName(actMapFileName);
// The righthand side of figure \ref{fig:SOMMAP} shows the activation
// map obtained.
// Just for visualization purposes, we zoom the image.
using ExpandType2 = itk::ExpandImageFilter<OutputImageType, OutputImageType>;
using InterpolatorType2 = itk::NearestNeighborInterpolateImageFunction<OutputImageType, double>;
InterpolatorType2::Pointer interpolator2 = InterpolatorType2::New();
ExpandType2::Pointer expand2 = ExpandType2::New();
expand2->SetInput(somAct->GetOutput());
expand2->SetExpandFactors(20);
expand2->SetInterpolator(interpolator2);
// expand2->SetEdgePaddingValue(255);
expand2->UpdateOutputInformation();
actWriter->SetInput(expand2->GetOutput());
actWriter->Update();
}
else
{
std::cerr << "The activation map file name is null" << std::endl;
return EXIT_FAILURE;
}
return EXIT_SUCCESS;
}