MayaFlux 0.2.0
Digital-First Multimedia Processing Framework
Loading...
Searching...
No Matches

◆ create_dimensions()

std::vector< DataDimension > MayaFlux::Kakshya::DataDimension::create_dimensions ( DataModality  modality,
const std::vector< uint64_t > &  shape,
MemoryLayout  layout = MemoryLayout::ROW_MAJOR 
)
static

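Create dimension descriptors for a data modality. The rank of shape must match what the modality expects (for example, a 2D shape [samples, channels] for AUDIO_MULTICHANNEL, or a 4D shape [frames, height, width, channels] for VIDEO_COLOR); a mismatched rank or an unsupported modality is reported through error<std::invalid_argument>.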

Parameters
modality: Target data modality
shape: Dimensional sizes
layout: Memory layout strategy
Returns
Vector of DataDimension objects

Definition at line 107 of file NDData.cpp.

111{
112 std::vector<DataDimension> dims;
113 auto strides = calculate_strides(shape, layout);
114
115 switch (modality) {
117 if (shape.size() != 1) {
118 error<std::invalid_argument>(
121 std::source_location::current(),
122 "AUDIO_1D requires 1D shape");
123 }
124 dims.push_back(DataDimension::time(shape[0]));
125 break;
126
128 if (shape.size() != 2) {
129 error<std::invalid_argument>(
132 std::source_location::current(),
133 "AUDIO_MULTICHANNEL requires 2D shape [samples, channels]");
134 }
135 dims.push_back(DataDimension::time(shape[0]));
136 dims.push_back(DataDimension::channel(shape[1], strides[1]));
137 break;
138
140 if (shape.size() != 2) {
141 error<std::invalid_argument>(
144 std::source_location::current(),
145 "IMAGE_2D requires 2D shape [height, width]");
146 }
147 dims.push_back(DataDimension::spatial(shape[0], 'y', strides[0]));
148 dims.push_back(DataDimension::spatial(shape[1], 'x', strides[1]));
149 break;
150
152 if (shape.size() != 3) {
153 error<std::invalid_argument>(
156 std::source_location::current(),
157 "IMAGE_COLOR requires 3D shape [height, width, channels]");
158 }
159 dims.push_back(DataDimension::spatial(shape[0], 'y', strides[0]));
160 dims.push_back(DataDimension::spatial(shape[1], 'x', strides[1]));
161 dims.push_back(DataDimension::channel(shape[2], strides[2]));
162 break;
163
165 if (shape.size() != 2) {
166 error<std::invalid_argument>(
169 std::source_location::current(),
170 "SPECTRAL_2D requires 2D shape [time_windows, frequency_bins]");
171 }
172 dims.push_back(DataDimension::time(shape[0], "time_windows"));
173 dims.push_back(DataDimension::frequency(shape[1]));
174 dims[1].stride = strides[1];
175 break;
176
178 if (shape.size() != 3) {
179 error<std::invalid_argument>(
182 std::source_location::current(),
183 "VOLUMETRIC_3D requires 3D shape [x, y, z]");
184 }
185 dims.push_back(DataDimension::spatial(shape[0], 'x', strides[0]));
186 dims.push_back(DataDimension::spatial(shape[1], 'y', strides[1]));
187 dims.push_back(DataDimension::spatial(shape[2], 'z', strides[2]));
188 break;
189
191 if (shape.size() != 3) {
192 error<std::invalid_argument>(
195 std::source_location::current(),
196 "VIDEO_GRAYSCALE requires 3D shape [frames, height, width]");
197 }
198 dims.push_back(DataDimension::time(shape[0], "frames"));
199 dims.push_back(DataDimension::spatial(shape[1], 'y', strides[1]));
200 dims.push_back(DataDimension::spatial(shape[2], 'x', strides[2]));
201 break;
202
204 if (shape.size() != 4) {
205 error<std::invalid_argument>(
208 std::source_location::current(),
209 "VIDEO_COLOR requires 4D shape [frames, height, width, channels]");
210 }
211 dims.push_back(DataDimension::time(shape[0], "frames"));
212 dims.push_back(DataDimension::spatial(shape[1], 'y', strides[1]));
213 dims.push_back(DataDimension::spatial(shape[2], 'x', strides[2]));
214 dims.push_back(DataDimension::channel(shape[3], strides[3]));
215 break;
216
217 default:
218 error<std::invalid_argument>(
221 std::source_location::current(),
222 "Unsupported modality for dimension creation: {}", modality_to_string(modality));
223 }
224
225 return dims;
226}
@ Runtime
General runtime operations (default fallback)
@ Kakshya
Containers [Signalsource, Stream, File], Regions, DataProcessors.
@ AUDIO_MULTICHANNEL
Multi-channel audio.
@ SPECTRAL_2D
2D spectral data (time + frequency)
@ VOLUMETRIC_3D
3D volumetric data
@ VIDEO_GRAYSCALE
3D video (time + 2D grayscale)
@ VIDEO_COLOR
4D video (time + 2D + color)
@ IMAGE_COLOR
2D RGB/RGBA image
@ IMAGE_2D
2D image (grayscale or single channel)
std::string_view modality_to_string(DataModality modality)
Convert DataModality enum to string representation.
Definition NDData.cpp:82
static DataDimension spatial(uint64_t size, char axis, uint64_t stride=1, std::string name="spatial")
Convenience constructor for a spatial dimension.
Definition NDData.cpp:31
static DataDimension frequency(uint64_t bins, std::string name="frequency")
Convenience constructor for a frequency dimension.
Definition NDData.cpp:26
static DataDimension time(uint64_t samples, std::string name="time")
Convenience constructor for a temporal (time) dimension.
Definition NDData.cpp:16
static std::vector< uint64_t > calculate_strides(const std::vector< uint64_t > &shape, MemoryLayout layout)
Calculate memory strides based on shape and layout.
Definition NDData.cpp:228
static DataDimension channel(uint64_t count, uint64_t stride=1)
Convenience constructor for a channel dimension.
Definition NDData.cpp:21

References MayaFlux::Kakshya::AUDIO_1D, MayaFlux::Kakshya::AUDIO_MULTICHANNEL, calculate_strides(), channel(), frequency(), MayaFlux::Kakshya::IMAGE_2D, MayaFlux::Kakshya::IMAGE_COLOR, MayaFlux::Journal::Kakshya, MayaFlux::Kakshya::modality_to_string(), MayaFlux::Journal::Runtime, spatial(), MayaFlux::Kakshya::SPECTRAL_2D, time(), MayaFlux::Kakshya::VIDEO_COLOR, MayaFlux::Kakshya::VIDEO_GRAYSCALE, and MayaFlux::Kakshya::VOLUMETRIC_3D.

Referenced by MayaFlux::Yantra::infer_from_region(), MayaFlux::Yantra::infer_from_region_group(), and MayaFlux::Kakshya::SoundStreamContainer::setup_dimensions().

+ Here is the call graph for this function:
+ Here is the caller graph for this function: