Ocean
InitializerAppearanceMappingI1.h
Go to the documentation of this file.
1 /*
2  * Copyright (c) Meta Platforms, Inc. and affiliates.
3  *
4  * This source code is licensed under the MIT license found in the
5  * LICENSE file in the root directory of this source tree.
6  */
7 
8 #ifndef META_OCEAN_CV_SYNTHESIS_INITIALIZER_APPEARANCE_MAPPING_I_1_H
9 #define META_OCEAN_CV_SYNTHESIS_INITIALIZER_APPEARANCE_MAPPING_I_1_H
10 
18 
19 #include "ocean/base/RandomI.h"
20 
22 
23 namespace Ocean
24 {
25 
26 namespace CV
27 {
28 
29 namespace Synthesis
30 {
31 
32 /**
33  * This class implements an initializer that initializes the mapping by appearance constraints for mappings with integer accuracy.
34  * For each mask pixel the best matching target pixel is assigned as initial mapping.<br>
35  * The matching is provided by a randomized test of best matching positions.
36  * @tparam tPatchSize Defines the patch size for the matching, must be 1
37  * @tparam tIterations Defines the number of random seek iterations for each pixel inside the synthesis mask, with range [1, infinity)
38  * @see LayerI1, MappingI.
39  * @ingroup cvsynthesis
40  */
41 template <unsigned int tPatchSize, unsigned int tIterations>
43  virtual public InitializerAppearanceMapping,
44  virtual public InitializerI,
45  virtual public InitializerRandomized,
46  virtual public InitializerSubset,
47  virtual public Initializer1
48 {
49  public:
50 
51  /**
52  * Creates a new initializer object.
53  * @param layer The layer for that the initial mapping has to be provided
54  * @param randomGenerator Random number generator
55  */
56  inline InitializerAppearanceMappingI1(LayerI1& layer, RandomGenerator& randomGenerator);
57 
58  private:
59 
60  /**
61  * Initializes a subset of the entire mapping area.
62  * @see InitializerSubset::initializeSubset().
63  * @see initializeSubsetChannels().
64  */
65  void initializeSubset(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const override;
66 
67  /**
68  * This function is the specialization of the default initializeSubset() function.
69  * @param firstColumn First column of the mapping area to be initialized
70  * @param numberColumns Number of columns of the mapping area to be handled
71  * @param firstRow First row of the mapping area to be initialized
72  * @param numberRows Number of rows of the mapping area to be handled
73  * @tparam tChannels The number of channels the frame has, with range [1, infinity)
74  * @see initializeSubset().
75  */
76  template <unsigned int tChannels>
77  void initializeSubsetChannels(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const;
78 };
79 
80 template <unsigned int tPatchSize, unsigned int tIterations>
82  Initializer(layer),
84  InitializerI(layer),
85  InitializerRandomized(layer, randomGenerator),
86  InitializerSubset(layer),
87  Initializer1(layer)
88 {
89  // nothing to do here
90 }
91 
92 template <unsigned int tPatchSize, unsigned int tIterations>
93 void InitializerAppearanceMappingI1<tPatchSize, tIterations>::initializeSubset(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const
94 {
95  static_assert(tPatchSize == 1u, "Invalid patch size!");
96 
97  ocean_assert(layer_.frame().numberPlanes() == 1u);
98  ocean_assert(layer_.frame().dataType() == FrameType::DT_UNSIGNED_INTEGER_8);
99 
100  switch (layer_.frame().channels())
101  {
102  case 1u:
103  initializeSubsetChannels<1u>(firstColumn, numberColumns, firstRow, numberRows);
104  break;
105 
106  case 2u:
107  initializeSubsetChannels<2u>(firstColumn, numberColumns, firstRow, numberRows);
108  break;
109 
110  case 3u:
111  initializeSubsetChannels<3u>(firstColumn, numberColumns, firstRow, numberRows);
112  break;
113 
114  case 4u:
115  initializeSubsetChannels<4u>(firstColumn, numberColumns, firstRow, numberRows);
116  break;
117 
118  default:
119  ocean_assert(false && "Invalid frame type.");
120  }
121 }
122 
123 template <unsigned int tPatchSize, unsigned int tIterations>
124 template <unsigned int tChannels>
125 void InitializerAppearanceMappingI1<tPatchSize, tIterations>::initializeSubsetChannels(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const
126 {
127  static_assert(tPatchSize == 1u, "Invalid patch size!");
128  static_assert(tChannels >= 1u, "Invalid channel number!");
129 
130  const unsigned int tPatchSize_2 = tPatchSize / 2u;
131 
132  const unsigned int width = layerI_.width();
133  const unsigned int height = layerI_.height();
134 
135  MappingI& layerMapping = layerI_.mapping();
136 
137  const Frame& frame = layerI_.frame();
138  const Frame& mask = layerI_.mask();
139 
140  ocean_assert(frame.isValid() && mask.isValid());
141 
142  ocean_assert(frame.numberPlanes() == 1u && frame.dataType() == FrameType::DT_UNSIGNED_INTEGER_8);
143  ocean_assert(frame.width() == width);
144  ocean_assert(frame.height() == height);
145 
146  ocean_assert(frame.isFrameTypeCompatible(FrameType(mask, frame.pixelFormat()), false));
147 
148  RandomGenerator randomGenerator(randomGenerator_);
149 
150  const uint8_t* const frameData = frame.constdata<uint8_t>();
151  const uint8_t* const maskData = mask.constdata<uint8_t>();
152 
153  const unsigned int framePaddingElements = frame.paddingElements();
154 
155  const unsigned int maskStrideElements = mask.strideElements();
156 
157 #ifdef OCEAN_DEBUG
158  const PixelBoundingBox& debugLayerBoundingBox = layerI_.boundingBox();
159  ocean_assert(!debugLayerBoundingBox || firstColumn >= debugLayerBoundingBox.left());
160  ocean_assert(!debugLayerBoundingBox || firstColumn + numberColumns <= debugLayerBoundingBox.rightEnd());
161  ocean_assert(!debugLayerBoundingBox || firstRow >= debugLayerBoundingBox.top());
162  ocean_assert(!debugLayerBoundingBox || firstRow + numberRows <= debugLayerBoundingBox.bottomEnd());
163 #endif // OCEAN_DEBUG
164 
165  ocean_assert(firstColumn + numberColumns <= width);
166  ocean_assert(firstRow + numberRows <= height);
167 
168  for (unsigned int y = firstRow; y < firstRow + numberRows; ++y)
169  {
170  const uint8_t* maskRow = maskData + y * maskStrideElements + firstColumn;
171  PixelPosition* position = layerMapping.row(y) + firstColumn;
172 
173  for (unsigned int x = firstColumn; x < firstColumn + numberColumns; ++x)
174  {
175  if (*maskRow++ != 0xFFu)
176  {
177  unsigned int bestX, bestY;
178 
179  do
180  {
181  bestX = RandomI::random(randomGenerator, tPatchSize_2, width - tPatchSize_2 - 1u);
182  bestY = RandomI::random(randomGenerator, tPatchSize_2, height - tPatchSize_2 - 1u);
183  }
184  while (maskData[bestY * maskStrideElements + bestX] != 0xFF);
185 
186  unsigned int bestSSD = CV::SumSquareDifferences::patch8BitPerChannel<tChannels, tPatchSize>(frameData, frameData, width, width, x, y, bestX, bestY, framePaddingElements, framePaddingElements);
187 
188  for (unsigned int n = 1u; n < tIterations; ++n)
189  {
190  const unsigned int candidateX = RandomI::random(randomGenerator, tPatchSize_2, width - tPatchSize_2 - 1u);
191  const unsigned int candidateY = RandomI::random(randomGenerator, tPatchSize_2, height - tPatchSize_2 - 1u);
192 
193  if (maskData[candidateY * maskStrideElements + candidateX] != 0xFF)
194  {
195  continue;
196  }
197 
198  const unsigned int candidateSSD = CV::SumSquareDifferences::patch8BitPerChannel<tChannels, tPatchSize>(frameData, frameData, width, width, x, y, candidateX, candidateY, framePaddingElements, framePaddingElements);
199 
200  if (candidateSSD < bestSSD)
201  {
202  bestX = candidateX;
203  bestY = candidateY;
204  bestSSD = candidateSSD;
205  }
206  }
207 
208  position->setPosition(bestX, bestY);
209  }
210 
211  ++position;
212  }
213  }
214 }
215 
216 }
217 
218 }
219 
220 }
221 
222 #endif // META_OCEAN_CV_SYNTHESIS_INITIALIZER_APPEARANCE_MAPPING_I_1_H
T left() const
Returns the left (including) pixel position of this bounding box.
Definition: PixelBoundingBox.h:416
T rightEnd() const
Returns the right (excluding) pixel position of this bounding box.
Definition: PixelBoundingBox.h:437
T bottomEnd() const
Returns the bottom (excluding) pixel position of this bounding box.
Definition: PixelBoundingBox.h:451
T top() const
Returns the top (including) pixel position of this bounding box.
Definition: PixelBoundingBox.h:423
void setPosition(const T &x, const T &y)
Sets the two coordinate values of this object.
Definition: PixelPosition.h:482
This class is the base class for all initializers that are provided for a single frame only.
Definition: Initializer1.h:29
This class implements the abstract base class for all appearance initializers.
Definition: InitializerAppearanceMapping.h:28
This class implements an initializer that initializes the mapping by appearance constraints for mappings with integer accuracy.
Definition: InitializerAppearanceMappingI1.h:48
InitializerAppearanceMappingI1(LayerI1 &layer, RandomGenerator &randomGenerator)
Creates a new initializer object.
Definition: InitializerAppearanceMappingI1.h:81
void initializeSubsetChannels(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const
This function is the specialization of the default initializeSubset() function.
Definition: InitializerAppearanceMappingI1.h:125
void initializeSubset(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const override
Initializes a subset of the entire mapping area.
Definition: InitializerAppearanceMappingI1.h:93
This class implements the base class for all synthesis initializers.
Definition: Initializer.h:34
This class implements the base class for all initializer objects that are applied for mappings with i...
Definition: InitializerI.h:30
This class is the base class for all initializers that mainly initialize the synthesis mapping by a h...
Definition: InitializerRandomized.h:30
This class is the base class for all initializer objects that can separate the initialization process...
Definition: InitializerSubset.h:29
This class implements a single layer for pixel synthesis within one frame and pixel accuracy.
Definition: LayerI1.h:41
This class implements a mapping with integer accuracy.
Definition: MappingI.h:30
const PixelPosition * row(const unsigned int y) const
Returns the pointer to a mapping row.
Definition: MappingI.h:243
This class implements Ocean's image class.
Definition: Frame.h:1760
unsigned int strideElements(const unsigned int planeIndex=0u) const
Returns the number of elements within one row, including optional padding at the end of a row for a s...
Definition: Frame.h:4026
const T * constdata(const unsigned int planeIndex=0u) const
Returns a pointer to the read-only pixel data of a specific plane.
Definition: Frame.h:4136
bool isValid() const
Returns whether this frame is valid.
Definition: Frame.h:4416
unsigned int paddingElements(const unsigned int planeIndex=0u) const
Returns the optional number of padding elements at the end of each row for a specific plane.
Definition: Frame.h:4010
Definition of a frame type composed by the frame dimension, pixel format and pixel origin.
Definition: Frame.h:30
unsigned int width() const
Returns the width of the frame format in pixel.
Definition: Frame.h:3111
uint32_t numberPlanes() const
Returns the number of planes of the pixel format of this frame.
Definition: Frame.h:3151
PixelFormat pixelFormat() const
Returns the pixel format of the frame.
Definition: Frame.h:3121
@ DT_UNSIGNED_INTEGER_8
Unsigned 8 bit integer data type (uint8_t).
Definition: Frame.h:41
unsigned int height() const
Returns the height of the frame in pixel.
Definition: Frame.h:3116
DataType dataType() const
Returns the data type of the pixel format of this frame.
Definition: Frame.h:3131
bool isFrameTypeCompatible(const FrameType &frameType, const bool allowDifferentPixelOrigins) const
Returns whether this frame type is compatible with a given frame type.
Definition: Frame.h:3171
This class implements a generator for random numbers.
Definition: RandomGenerator.h:42
static unsigned int random(const unsigned int maxValue)
Returns one random integer value with specified maximum value.
The namespace covering the entire Ocean framework.
Definition: Accessor.h:15