Create dimension descriptors for a data modality.
111{
112 std::vector<DataDimension> dims;
114
115 switch (modality) {
117 if (shape.size() != 1) {
118 error<std::invalid_argument>(
121 std::source_location::current(),
122 "AUDIO_1D requires 1D shape");
123 }
125 break;
126
128 if (shape.size() != 2) {
129 error<std::invalid_argument>(
132 std::source_location::current(),
133 "AUDIO_MULTICHANNEL requires 2D shape [samples, channels]");
134 }
137 break;
138
140 if (shape.size() != 2) {
141 error<std::invalid_argument>(
144 std::source_location::current(),
145 "IMAGE_2D requires 2D shape [height, width]");
146 }
149 break;
150
152 if (shape.size() != 3) {
153 error<std::invalid_argument>(
156 std::source_location::current(),
157 "IMAGE_COLOR requires 3D shape [height, width, channels]");
158 }
162 break;
163
165 if (shape.size() != 2) {
166 error<std::invalid_argument>(
169 std::source_location::current(),
170 "SPECTRAL_2D requires 2D shape [time_windows, frequency_bins]");
171 }
174 dims[1].stride = strides[1];
175 break;
176
178 if (shape.size() != 3) {
179 error<std::invalid_argument>(
182 std::source_location::current(),
183 "VOLUMETRIC_3D requires 3D shape [x, y, z]");
184 }
188 break;
189
191 if (shape.size() != 3) {
192 error<std::invalid_argument>(
195 std::source_location::current(),
196 "VIDEO_GRAYSCALE requires 3D shape [frames, height, width]");
197 }
201 break;
202
204 if (shape.size() != 4) {
205 error<std::invalid_argument>(
208 std::source_location::current(),
209 "VIDEO_COLOR requires 4D shape [frames, height, width, channels]");
210 }
215 break;
216
217 default:
218 error<std::invalid_argument>(
221 std::source_location::current(),
223 }
224
225 return dims;
226}
@ Runtime
General runtime operations (default fallback)
@ Kakshya
Containers[Signalsource, Stream, File], Regions, DataProcessors.
@ AUDIO_MULTICHANNEL
Multi-channel audio.
@ SPECTRAL_2D
2D spectral data (time + frequency)
@ AUDIO_1D
1D audio signal
@ VOLUMETRIC_3D
3D volumetric data
@ VIDEO_GRAYSCALE
3D video (time + 2D grayscale)
@ VIDEO_COLOR
4D video (time + 2D + color)
@ IMAGE_COLOR
2D RGB/RGBA image
@ IMAGE_2D
2D image (grayscale or single channel)
std::string_view modality_to_string(DataModality modality)
Convert DataModality enum to string representation.
static DataDimension spatial(uint64_t size, char axis, uint64_t stride=1, std::string name="spatial")
Convenience constructor for a spatial dimension.
static DataDimension frequency(uint64_t bins, std::string name="frequency")
Convenience constructor for a frequency dimension.
static DataDimension time(uint64_t samples, std::string name="time")
Convenience constructor for a temporal (time) dimension.
static std::vector< uint64_t > calculate_strides(const std::vector< uint64_t > &shape, MemoryLayout layout)
Calculate memory strides based on shape and layout.
static DataDimension channel(uint64_t count, uint64_t stride=1)
Convenience constructor for a channel dimension.