44 name = std::string(
"spatial_") + axis;
56 return spatial(height,
'y', width *
sizeof(
float));
61 return spatial(depth,
'z', width * height *
sizeof(
float));
71 uint64_t element_count,
72 uint8_t components_per_element,
107 const std::vector<uint64_t>& shape,
110 std::vector<DataDimension> dims;
115 if (shape.size() != 1) {
116 throw std::invalid_argument(
"AUDIO_1D requires 1D shape");
122 if (shape.size() != 2) {
123 throw std::invalid_argument(
"AUDIO_MULTICHANNEL requires 2D shape [samples, channels]");
130 if (shape.size() != 2) {
131 throw std::invalid_argument(
"IMAGE_2D requires 2D shape [height, width]");
138 if (shape.size() != 3) {
139 throw std::invalid_argument(
"IMAGE_COLOR requires 3D shape [height, width, channels]");
147 if (shape.size() != 2) {
148 throw std::invalid_argument(
"SPECTRAL_2D requires 2D shape [time_windows, frequency_bins]");
152 dims[1].stride = strides[1];
156 if (shape.size() != 3) {
157 throw std::invalid_argument(
"VOLUMETRIC_3D requires 3D shape [x, y, z]");
165 if (shape.size() != 3) {
166 throw std::invalid_argument(
"VIDEO_GRAYSCALE requires 3D shape [frames, height, width]");
174 if (shape.size() != 4) {
175 throw std::invalid_argument(
"VIDEO_COLOR requires 4D shape [frames, height, width, channels]");
184 throw std::invalid_argument(
"Unsupported modality for dimension creation");
191 const std::vector<uint64_t>& shape,
197 std::vector<uint64_t> strides(shape.size());
200 auto reversed_shape = shape | std::views::reverse;
202 reversed_shape.begin(),
203 reversed_shape.end(),
206 std::multiplies<uint64_t> {});
213 std::multiplies<uint64_t> {});
DataModality
Data modality types for cross-modal analysis.
@ AUDIO_MULTICHANNEL
Multi-channel audio.
@ SPECTRAL_2D
2D spectral data (time + frequency)
@ AUDIO_1D
1D audio signal
@ VOLUMETRIC_3D
3D volumetric data
@ VIDEO_GRAYSCALE
3D video (time + 2D grayscale)
@ VIDEO_COLOR
4D video (time + 2D + color)
@ IMAGE_COLOR
2D RGB/RGBA image
@ IMAGE_2D
2D image (grayscale or single channel)
MemoryLayout
Memory layout for multi-dimensional data.
@ ROW_MAJOR
C/C++ style (last dimension varies fastest)
std::string_view modality_to_string(DataModality modality)
Convert DataModality enum to string representation.
constexpr std::string_view enum_to_string(EnumType value) noexcept
Universal enum to string converter using magic_enum (original case)
Grouping information for sub-dimensions.
static DataDimension spatial_2d(uint64_t width, uint64_t height)
Convenience constructor for a 2D spatial dimension.
Role
Semantic role of the dimension.
@ COLOR
Color data (RGB/RGBA)
@ FREQUENCY
Spectral/frequency axis.
@ MIP_LEVEL
Mipmap levels.
@ SPATIAL_Y
Spatial Y axis.
@ TIME
Temporal progression (samples, frames, steps)
@ SPATIAL_Z
Spatial Z axis.
@ POSITION
Vertex positions (3D space)
@ CHANNEL
Parallel streams (audio channels, color channels)
@ SPATIAL_X
Spatial X axis (images, tensors)
uint64_t stride
Memory stride (elements between consecutive indices)
std::string name
Human-readable identifier for the dimension.
static DataDimension vertex_positions(uint64_t count)
Create dimension for vertex positions (vec3)
uint64_t size
Number of elements in this dimension.
static DataDimension vertex_colors(uint64_t count, bool has_alpha=false)
Create dimension for colors (vec3 or vec4)
Role role
Semantic hint for common operations.
static DataDimension spatial(uint64_t size, char axis, uint64_t stride=1, std::string name="spatial")
Convenience constructor for a spatial dimension.
static DataDimension grouped(std::string name, uint64_t element_count, uint8_t components_per_element, Role role=Role::CUSTOM)
Create dimension with component grouping.
static DataDimension vertex_normals(uint64_t count)
Create dimension for vertex normals (vec3)
static DataDimension frequency(uint64_t bins, std::string name="frequency")
Convenience constructor for a frequency dimension.
static DataDimension spatial_1d(uint64_t width)
Convenience constructor for an array dimension.
static DataDimension time(uint64_t samples, std::string name="time")
Convenience constructor for a temporal (time) dimension.
static std::vector< uint64_t > calculate_strides(const std::vector< uint64_t > &shape, MemoryLayout layout)
Calculate memory strides based on shape and layout.
static std::vector< DataDimension > create_dimensions(DataModality modality, const std::vector< uint64_t > &shape, MemoryLayout layout=MemoryLayout::ROW_MAJOR)
Create dimension descriptors for a data modality.
static DataDimension mipmap_levels(uint64_t levels)
Create dimension for mipmap levels.
static DataDimension texture_coords(uint64_t count)
Create dimension for texture coordinates (vec2)
static DataDimension spatial_3d(uint64_t width, uint64_t height, uint64_t depth)
Convenience constructor for a 3D spatial dimension.
std::optional< ComponentGroup > grouping
static DataDimension channel(uint64_t count, uint64_t stride=1)
Convenience constructor for a channel dimension.
Minimal dimension descriptor focusing on structure only.