Ocean
Loading...
Searching...
No Matches
InitializerAppearanceMappingI1.h
Go to the documentation of this file.
1/*
2 * Copyright (c) Meta Platforms, Inc. and affiliates.
3 *
4 * This source code is licensed under the MIT license found in the
5 * LICENSE file in the root directory of this source tree.
6 */
7
8#ifndef META_OCEAN_CV_SYNTHESIS_INITIALIZER_APPEARANCE_MAPPING_I_1_H
9#define META_OCEAN_CV_SYNTHESIS_INITIALIZER_APPEARANCE_MAPPING_I_1_H
10
18
19#include "ocean/base/RandomI.h"
20
22
23namespace Ocean
24{
25
26namespace CV
27{
28
29namespace Synthesis
30{
31
32/**
33 * This class implements an initializer that initializes the mapping by appearance constraints for mappings with integer accuracy.
34 * For each mask pixel the best matching target pixel is assigned as initial mapping.<br>
35 * The matching is provided by a randomized test of best matching positions.
36 * @tparam tPatchSize Defines the patch size for the matching, must be 1
37 * @tparam tIterations Defines the number of random seek iterations for each pixel inside the synthesis mask, with range [1, infinity)
38 * @see LayerI1, MappingI.
39 * @ingroup cvsynthesis
40 */
41template <unsigned int tPatchSize, unsigned int tIterations>
43 virtual public InitializerAppearanceMapping,
44 virtual public InitializerI,
45 virtual public InitializerRandomized,
46 virtual public InitializerSubset,
47 virtual public Initializer1
48{
49 public:
50
51 /**
52 * Creates a new initializer object.
53 * @param layer The layer for that the initial mapping has to be provided
54 * @param randomGenerator Random number generator
55 */
56 inline InitializerAppearanceMappingI1(LayerI1& layer, RandomGenerator& randomGenerator);
57
58 private:
59
60 /**
61 * Initializes a subset of the entire mapping area.
62 * @see InitializerSubset::initializeSubset().
63 * @see initializeSubsetChannels().
64 */
65 void initializeSubset(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const override;
66
67 /**
68 * This function is the specialization of the default initializeSubset() function.
69 * @param firstColumn First column of the mapping area to be initialized
70 * @param numberColumns Number of columns of the mapping area to be handled
71 * @param firstRow First row of the mapping area to be initialized
72 * @param numberRows Number of rows of the mapping area to be handled
73 * @tparam tChannels The number of channels the frame has, with range [1, infinity)
74 * @see initializeSubset().
75 */
76 template <unsigned int tChannels>
77 void initializeSubsetChannels(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const;
78};
79
80template <unsigned int tPatchSize, unsigned int tIterations>
82 Initializer(layer),
84 InitializerI(layer),
85 InitializerRandomized(layer, randomGenerator),
86 InitializerSubset(layer),
87 Initializer1(layer)
88{
89 // nothing to do here
90}
91
92template <unsigned int tPatchSize, unsigned int tIterations>
93void InitializerAppearanceMappingI1<tPatchSize, tIterations>::initializeSubset(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const
94{
95 static_assert(tPatchSize == 1u, "Invalid patch size!");
96
97 ocean_assert(layer_.frame().numberPlanes() == 1u);
98 ocean_assert(layer_.frame().dataType() == FrameType::DT_UNSIGNED_INTEGER_8);
99
100 switch (layer_.frame().channels())
101 {
102 case 1u:
103 initializeSubsetChannels<1u>(firstColumn, numberColumns, firstRow, numberRows);
104 break;
105
106 case 2u:
107 initializeSubsetChannels<2u>(firstColumn, numberColumns, firstRow, numberRows);
108 break;
109
110 case 3u:
111 initializeSubsetChannels<3u>(firstColumn, numberColumns, firstRow, numberRows);
112 break;
113
114 case 4u:
115 initializeSubsetChannels<4u>(firstColumn, numberColumns, firstRow, numberRows);
116 break;
117
118 default:
119 ocean_assert(false && "Invalid frame type.");
120 }
121}
122
123template <unsigned int tPatchSize, unsigned int tIterations>
124template <unsigned int tChannels>
125void InitializerAppearanceMappingI1<tPatchSize, tIterations>::initializeSubsetChannels(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const
126{
127 static_assert(tPatchSize == 1u, "Invalid patch size!");
128 static_assert(tChannels >= 1u, "Invalid channel number!");
129
130 const unsigned int tPatchSize_2 = tPatchSize / 2u;
131
132 const unsigned int width = layerI_.width();
133 const unsigned int height = layerI_.height();
134
135 MappingI& layerMapping = layerI_.mapping();
136
137 const Frame& frame = layerI_.frame();
138 const Frame& mask = layerI_.mask();
139
140 ocean_assert(frame.isValid() && mask.isValid());
141
142 ocean_assert(frame.numberPlanes() == 1u && frame.dataType() == FrameType::DT_UNSIGNED_INTEGER_8);
143 ocean_assert(frame.width() == width);
144 ocean_assert(frame.height() == height);
145
146 ocean_assert(frame.isFrameTypeCompatible(FrameType(mask, frame.pixelFormat()), false));
147
148 RandomGenerator randomGenerator(randomGenerator_);
149
150 const uint8_t* const frameData = frame.constdata<uint8_t>();
151 const uint8_t* const maskData = mask.constdata<uint8_t>();
152
153 const unsigned int framePaddingElements = frame.paddingElements();
154
155 const unsigned int maskStrideElements = mask.strideElements();
156
157#ifdef OCEAN_DEBUG
158 const PixelBoundingBox& debugLayerBoundingBox = layerI_.boundingBox();
159 ocean_assert(!debugLayerBoundingBox || firstColumn >= debugLayerBoundingBox.left());
160 ocean_assert(!debugLayerBoundingBox || firstColumn + numberColumns <= debugLayerBoundingBox.rightEnd());
161 ocean_assert(!debugLayerBoundingBox || firstRow >= debugLayerBoundingBox.top());
162 ocean_assert(!debugLayerBoundingBox || firstRow + numberRows <= debugLayerBoundingBox.bottomEnd());
163#endif // OCEAN_DEBUG
164
165 ocean_assert(firstColumn + numberColumns <= width);
166 ocean_assert(firstRow + numberRows <= height);
167
168 for (unsigned int y = firstRow; y < firstRow + numberRows; ++y)
169 {
170 const uint8_t* maskRow = maskData + y * maskStrideElements + firstColumn;
171 PixelPosition* position = layerMapping.row(y) + firstColumn;
172
173 for (unsigned int x = firstColumn; x < firstColumn + numberColumns; ++x)
174 {
175 if (*maskRow++ != 0xFFu)
176 {
177 unsigned int bestX, bestY;
178
179 do
180 {
181 bestX = RandomI::random(randomGenerator, tPatchSize_2, width - tPatchSize_2 - 1u);
182 bestY = RandomI::random(randomGenerator, tPatchSize_2, height - tPatchSize_2 - 1u);
183 }
184 while (maskData[bestY * maskStrideElements + bestX] != 0xFF);
185
186 unsigned int bestSSD = CV::SumSquareDifferences::patch8BitPerChannel<tChannels, tPatchSize>(frameData, frameData, width, width, x, y, bestX, bestY, framePaddingElements, framePaddingElements);
187
188 for (unsigned int n = 1u; n < tIterations; ++n)
189 {
190 const unsigned int candidateX = RandomI::random(randomGenerator, tPatchSize_2, width - tPatchSize_2 - 1u);
191 const unsigned int candidateY = RandomI::random(randomGenerator, tPatchSize_2, height - tPatchSize_2 - 1u);
192
193 if (maskData[candidateY * maskStrideElements + candidateX] != 0xFF)
194 {
195 continue;
196 }
197
198 const unsigned int candidateSSD = CV::SumSquareDifferences::patch8BitPerChannel<tChannels, tPatchSize>(frameData, frameData, width, width, x, y, candidateX, candidateY, framePaddingElements, framePaddingElements);
199
200 if (candidateSSD < bestSSD)
201 {
202 bestX = candidateX;
203 bestY = candidateY;
204 bestSSD = candidateSSD;
205 }
206 }
207
208 position->setPosition(bestX, bestY);
209 }
210
211 ++position;
212 }
213 }
214}
215
216}
217
218}
219
220}
221
222#endif // META_OCEAN_CV_SYNTHESIS_INITIALIZER_APPEARANCE_MAPPING_I_1_H
T left() const
Returns the left (including) pixel position of this bounding box.
Definition PixelBoundingBox.h:416
T rightEnd() const
Returns the right (excluding) pixel position of this bounding box.
Definition PixelBoundingBox.h:437
T bottomEnd() const
Returns the bottom (excluding) pixel position of this bounding box.
Definition PixelBoundingBox.h:451
T top() const
Returns the top (including) pixel position of this bounding box.
Definition PixelBoundingBox.h:423
void setPosition(const T &x, const T &y)
Sets the two coordinate values of this object.
Definition PixelPosition.h:482
This class is the base class for all initializers that are provided for a single frame only.
Definition Initializer1.h:29
This class implements the abstract base class for all appearance initializers.
Definition InitializerAppearanceMapping.h:28
This class implements an initializer that initializes the mapping by appearance constraints for mappings with integer accuracy.
Definition InitializerAppearanceMappingI1.h:48
InitializerAppearanceMappingI1(LayerI1 &layer, RandomGenerator &randomGenerator)
Creates a new initializer object.
Definition InitializerAppearanceMappingI1.h:81
void initializeSubsetChannels(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const
This function is the specialization of the default initializeSubset() function.
Definition InitializerAppearanceMappingI1.h:125
void initializeSubset(const unsigned int firstColumn, const unsigned int numberColumns, const unsigned int firstRow, const unsigned int numberRows) const override
Initializes a subset of the entire mapping area.
Definition InitializerAppearanceMappingI1.h:93
This class implements the base class for all synthesis initializers.
Definition Initializer.h:34
This class implements the base class for all initializer objects that are applied for mappings with i...
Definition InitializerI.h:30
This class is the base class for all initializers that mainly initialize the synthesis mapping by a h...
Definition InitializerRandomized.h:30
This class is the base class for all initializer objects that can separate the initialization process...
Definition InitializerSubset.h:29
This class implements a single layer for pixel synthesis within one frame and pixel accuracy.
Definition LayerI1.h:41
This class implements a mapping with integer accuracy.
Definition MappingI.h:30
const PixelPosition * row(const unsigned int y) const
Returns the pointer to a mapping row.
Definition MappingI.h:243
This class implements Ocean's image class.
Definition Frame.h:1808
unsigned int strideElements(const unsigned int planeIndex=0u) const
Returns the number of elements within one row, including optional padding at the end of a row for a s...
Definition Frame.h:4138
const T * constdata(const unsigned int planeIndex=0u) const
Returns a pointer to the read-only pixel data of a specific plane.
Definition Frame.h:4248
bool isValid() const
Returns whether this frame is valid.
Definition Frame.h:4528
unsigned int paddingElements(const unsigned int planeIndex=0u) const
Returns the optional number of padding elements at the end of each row for a specific plane.
Definition Frame.h:4122
Definition of a frame type composed by the frame dimension, pixel format and pixel origin.
Definition Frame.h:30
unsigned int width() const
Returns the width of the frame format in pixel.
Definition Frame.h:3170
uint32_t numberPlanes() const
Returns the number of planes of the pixel format of this frame.
Definition Frame.h:3210
PixelFormat pixelFormat() const
Returns the pixel format of the frame.
Definition Frame.h:3180
@ DT_UNSIGNED_INTEGER_8
Unsigned 8 bit integer data type (uint8_t).
Definition Frame.h:41
unsigned int height() const
Returns the height of the frame in pixel.
Definition Frame.h:3175
DataType dataType() const
Returns the data type of the pixel format of this frame.
Definition Frame.h:3190
bool isFrameTypeCompatible(const FrameType &frameType, const bool allowDifferentPixelOrigins) const
Returns whether this frame type is compatible with a given frame type.
Definition Frame.h:3232
This class implements a generator for random numbers.
Definition RandomGenerator.h:42
static unsigned int random(const unsigned int maxValue)
Returns one random integer value with specified maximum value.
The namespace covering the entire Ocean framework.
Definition Accessor.h:15