Create dimension descriptors for a data modality.
112{
113 std::vector<DataDimension> dims;
115
116 switch (modality) {
118 if (shape.size() != 1) {
119 error<std::invalid_argument>(
122 std::source_location::current(),
123 "AUDIO_1D requires 1D shape");
124 }
126 break;
127
129 if (shape.size() != 2) {
130 error<std::invalid_argument>(
133 std::source_location::current(),
134 "AUDIO_MULTICHANNEL requires 2D shape [samples, channels]");
135 }
138 break;
139
141 if (shape.size() != 2) {
142 error<std::invalid_argument>(
145 std::source_location::current(),
146 "IMAGE_2D requires 2D shape [height, width]");
147 }
150 break;
151
153 if (shape.size() != 3) {
154 error<std::invalid_argument>(
157 std::source_location::current(),
158 "IMAGE_COLOR requires 3D shape [height, width, channels]");
159 }
163 break;
164
166 if (shape.size() != 2) {
167 error<std::invalid_argument>(
170 std::source_location::current(),
171 "SPECTRAL_2D requires 2D shape [time_windows, frequency_bins]");
172 }
175 dims[1].stride = strides[1];
176 break;
177
179 if (shape.size() != 3) {
180 error<std::invalid_argument>(
183 std::source_location::current(),
184 "VOLUMETRIC_3D requires 3D shape [x, y, z]");
185 }
189 break;
190
192 if (shape.size() != 3) {
193 error<std::invalid_argument>(
196 std::source_location::current(),
197 "VIDEO_GRAYSCALE requires 3D shape [frames, height, width]");
198 }
202 break;
203
205 if (shape.size() != 4) {
206 error<std::invalid_argument>(
209 std::source_location::current(),
210 "VIDEO_COLOR requires 4D shape [frames, height, width, channels]");
211 }
216 break;
217
218 default:
219 error<std::invalid_argument>(
222 std::source_location::current(),
224 }
225
226 return dims;
227}
@ Runtime
General runtime operations (default fallback)
@ Kakshya
Containers [Signalsource, Stream, File], Regions, DataProcessors.
@ AUDIO_MULTICHANNEL
Multi-channel audio.
@ SPECTRAL_2D
2D spectral data (time + frequency)
@ AUDIO_1D
1D audio signal
@ VOLUMETRIC_3D
3D volumetric data
@ VIDEO_GRAYSCALE
3D video (time + 2D grayscale)
@ VIDEO_COLOR
4D video (time + 2D + color)
@ IMAGE_COLOR
2D RGB/RGBA image
@ IMAGE_2D
2D image (grayscale or single channel)
std::string_view modality_to_string(DataModality modality)
Convert DataModality enum to string representation.
static DataDimension spatial(uint64_t size, char axis, uint64_t stride=1, std::string name="spatial")
Convenience constructor for a spatial dimension.
static DataDimension frequency(uint64_t bins, std::string name="frequency")
Convenience constructor for a frequency dimension.
static DataDimension time(uint64_t samples, std::string name="time")
Convenience constructor for a temporal (time) dimension.
static std::vector< uint64_t > calculate_strides(const std::vector< uint64_t > &shape, MemoryLayout layout)
Calculate memory strides based on shape and layout.
static DataDimension channel(uint64_t count, uint64_t stride=1)
Convenience constructor for a channel dimension.