MayaFlux/SoundFileReader_8hpp_source.html

#pragma once


#include "FileReader.hpp"

#include "MayaFlux/Kakshya/Source/SoundFileContainer.hpp"


// Forward declarations for FFmpeg types.
// No FFmpeg header is included by this file; the types are only named here.
// AVFormatContext, AVCodecContext and SwrContext are used below purely as
// pointer members of FFmpegContext. AVFrame and AVPacket are declared but not
// otherwise referenced in this header.

extern "C" {

struct AVFormatContext;

struct AVCodecContext;

struct AVFrame;

struct AVPacket;

struct SwrContext;

}


namespace MayaFlux::IO {


/**
 * @enum AudioReadOptions
 * @brief Audio-specific reading options, usable as combinable bit flags.
 *
 * Every enumerator except NONE and ALL occupies a single bit, so options can be
 * combined with operator| and tested with operator&. Bit 1 (1 << 1) is not
 * assigned to any option in this header; the existing values are kept as-is.
 */
enum class AudioReadOptions : uint32_t {
    NONE = 0, ///< No audio-specific option selected
    NORMALIZE = 1 << 0, ///< Not implemented - would use FFmpeg's volume filter
    CONVERT_TO_MONO = 1 << 2, ///< Not implemented - would use FFmpeg's channel mixer
    DEINTERLEAVE = 1 << 3, ///< Convert from interleaved to planar layout
    ALL = 0xFFFFFFFF ///< Every bit set
};

/**
 * @brief Combine two option sets (bitwise OR of the underlying values).
 *
 * constexpr so that option combinations can be formed in constant expressions
 * (e.g. as default arguments or constexpr constants).
 *
 * @param a Left-hand option set.
 * @param b Right-hand option set.
 * @return Option set containing every bit set in either operand.
 */
[[nodiscard]] constexpr AudioReadOptions operator|(AudioReadOptions a, AudioReadOptions b) noexcept
{
    return static_cast<AudioReadOptions>(static_cast<uint32_t>(a) | static_cast<uint32_t>(b));
}

/**
 * @brief Intersect two option sets (bitwise AND of the underlying values).
 *
 * Typical use is testing a flag: `(opts & AudioReadOptions::DEINTERLEAVE) != AudioReadOptions::NONE`.
 *
 * @param a Left-hand option set.
 * @param b Right-hand option set.
 * @return Option set containing only the bits set in both operands.
 */
[[nodiscard]] constexpr AudioReadOptions operator&(AudioReadOptions a, AudioReadOptions b) noexcept
{
    return static_cast<AudioReadOptions>(static_cast<uint32_t>(a) & static_cast<uint32_t>(b));
}


/**
 * @brief Bundle of the FFmpeg handles and stream properties for one audio source.
 *
 * Groups the demuxer, decoder and resampler handles with the basic properties
 * of the selected audio stream. Cleanup is the job of the destructor, which is
 * declared here and defined out of line. Copying and moving are both deleted;
 * SoundFileReader holds instances through std::shared_ptr.
 */
struct FFmpegContext {
    AVFormatContext* format_context = nullptr; ///< Format (demuxer) handle; null until set
    AVCodecContext* codec_context = nullptr; ///< Codec (decoder) handle; null until set
    SwrContext* swr_context = nullptr; ///< Resampler handle; not required by is_valid()
    int audio_stream_index = -1; ///< Index of the audio stream; -1 means none selected
    uint64_t total_frames = 0; ///< Total frame count
    uint32_t sample_rate = 0; ///< Sample rate
    uint32_t channels = 0; ///< Channel count

    FFmpegContext() = default;
    ~FFmpegContext();

    // Non-copyable, non-movable (managed by shared_ptr)
    FFmpegContext(const FFmpegContext&) = delete;
    FFmpegContext(FFmpegContext&&) = delete;
    FFmpegContext& operator=(const FFmpegContext&) = delete;
    FFmpegContext& operator=(FFmpegContext&&) = delete;

    /**
     * @brief Report whether the context is usable for decoding.
     * @return True when both the format and codec handles are non-null and an
     *         audio stream index (>= 0) has been recorded.
     */
    bool is_valid() const
    {
        if (format_context == nullptr || codec_context == nullptr) {
            return false;
        }
        return audio_stream_index >= 0;
    }
};


/**
 * @class SoundFileReader
 * @brief FFmpeg-based audio file reader for MayaFlux
 *
 * SoundFileReader provides a high-level interface for reading and decoding audio files using FFmpeg.
 * It supports a wide range of audio formats, automatic sample format conversion to double precision,
 * resampling, metadata extraction, region/marker extraction, and streaming/seekable access.
 *
 * Key Features:
 * - Format detection and demuxing via libavformat
 * - Audio decoding via libavcodec
 * - Sample format conversion and resampling via libswresample (always outputs double)
 * - Metadata and region extraction from FFmpeg's parsed structures
 * - Seeking and timestamp handling via FFmpeg's APIs
 * - Automatic creation and population of Kakshya::SoundFileContainer for downstream processing
 * - Thread-safe access for reading and metadata queries
 *
 * Usage:
 *   SoundFileReader reader;
 *   if (reader.open("file.wav")) {
 *       auto metadata = reader.get_metadata();
 *       auto all_data = reader.read_all();
 *       auto container = reader.create_container();
 *       // ...
 *       reader.close();
 *   }
 *
 * All audio data is converted to double precision for internal processing.
 * The reader can output data in either interleaved or deinterleaved (planar) layout.
 */
class SoundFileReader : public FileReader {
public:
    /**
     * @brief Construct a new SoundFileReader object.
     * Initializes internal state and prepares for file operations.
     */
    SoundFileReader();

    /**
     * @brief Destroy the SoundFileReader object.
     * Cleans up FFmpeg resources and internal state.
     */
    ~SoundFileReader() override;

    /**
     * @brief Check if this reader can open the given file.
     * @param filepath Path to the file.
     * @return True if the file can be read, false otherwise.
     */
    bool can_read(const std::string& filepath) const override;

    /**
     * @brief Open an audio file for reading.
     * @param filepath Path to the file.
     * @param options File read options (defaults to FileReadOptions::ALL).
     * @return True if the file was opened successfully.
     */
    bool open(const std::string& filepath, FileReadOptions options = FileReadOptions::ALL) override;

    /**
     * @brief Close the currently open file and release resources.
     */
    void close() override;

    /**
     * @brief Check if a file is currently open.
     * @return True if a file is open, false otherwise.
     */
    bool is_open() const override;

    /**
     * @brief Get metadata for the currently open file.
     * @return Optional FileMetadata structure.
     */
    std::optional<FileMetadata> get_metadata() const override;

    /**
     * @brief Get all regions (markers, loops, etc.) from the file.
     * @return Vector of FileRegion structures.
     */
    std::vector<FileRegion> get_regions() const override;

    /**
     * @brief Read the entire audio file into memory.
     * @return Vector of Kakshya::DataVariant holding the decoded audio
     *         (sample storage is std::vector<double>, see get_data_type()).
     */
    std::vector<Kakshya::DataVariant> read_all() override;

    /**
     * @brief Read a specific region from the file.
     * @param region Region to read.
     * @return Vector of Kakshya::DataVariant containing the region's data.
     */
    std::vector<Kakshya::DataVariant> read_region(const FileRegion& region) override;

    /**
     * @brief Create a SignalSourceContainer for this file.
     * @return Shared pointer to a new SignalSourceContainer
     *         (concrete type reported by get_container_type()).
     */
    std::shared_ptr<Kakshya::SignalSourceContainer> create_container() override;

    /**
     * @brief Load file data into an existing SignalSourceContainer.
     * @param container Target container.
     * @return True if loading succeeded.
     */
    bool load_into_container(std::shared_ptr<Kakshya::SignalSourceContainer> container) override;

    /**
     * @brief Get the current read position in the file.
     * @return Vector of dimension indices (e.g., frame index).
     */
    std::vector<uint64_t> get_read_position() const override;

    /**
     * @brief Seek to a specific position in the file.
     * @param position Vector of dimension indices.
     * @return True if seek succeeded.
     */
    bool seek(const std::vector<uint64_t>& position) override;

    /**
     * @brief Get supported file extensions for this reader.
     * @return Vector of supported extensions (e.g., "wav", "flac").
     */
    std::vector<std::string> get_supported_extensions() const override;

    /**
     * @brief Get the C++ type of the data returned by this reader.
     * @return Type index for std::vector<double>.
     */
    std::type_index get_data_type() const override { return typeid(std::vector<double>); }

    /**
     * @brief Get the C++ type of the container returned by this reader.
     * @return Type index for Kakshya::SoundFileContainer.
     */
    std::type_index get_container_type() const override { return typeid(Kakshya::SoundFileContainer); }

    /**
     * @brief Get the last error message encountered by the reader.
     * @return Error string.
     */
    std::string get_last_error() const override;

    /**
     * @brief Check if the reader supports streaming access.
     * @return True if streaming is supported.
     */
    bool supports_streaming() const override;

    /**
     * @brief Get the preferred chunk size for streaming reads.
     * @return Preferred chunk size in frames.
     */
    uint64_t get_preferred_chunk_size() const override;

    /**
     * @brief Get the number of dimensions in the audio data (typically 2: time, channel).
     * @return Number of dimensions.
     */
    size_t get_num_dimensions() const override;

    /**
     * @brief Get the size of each dimension (e.g., frames, channels).
     * @return Vector of dimension sizes.
     */
    std::vector<uint64_t> get_dimension_sizes() const override;

    /**
     * @brief Read a specific number of frames from the file.
     * @param num_frames Number of frames to read.
     * @param offset Frame offset from beginning (defaults to 0).
     * @return Vector of Kakshya::DataVariant holding the decoded frames
     *         (sample storage is std::vector<double>).
     */
    std::vector<Kakshya::DataVariant> read_frames(uint64_t num_frames, uint64_t offset = 0);

    /**
     * @brief Set audio-specific read options.
     * @param options Audio read options (e.g., DEINTERLEAVE).
     * @note Plain assignment to the member; no lock is taken in this setter.
     */
    void set_audio_options(AudioReadOptions options) { m_audio_options = options; }

    /**
     * @brief Set the target sample rate for resampling.
     * @param sample_rate Target sample rate (0 = no resampling).
     * @note Plain assignment to the member; no lock is taken in this setter.
     */
    void set_target_sample_rate(uint32_t sample_rate) { m_target_sample_rate = sample_rate; }

    /**
     * @brief Set the target bit depth (ignored, always outputs double).
     * @param bit_depth Target bit depth; the value is only stored.
     * @deprecated Always outputs double precision.
     */
    void set_target_bit_depth(uint32_t bit_depth) { m_target_bit_depth = bit_depth; }

    /**
     * @brief Initialize FFmpeg libraries (thread-safe, called automatically).
     */
    static void initialize_ffmpeg();

private:
    /**
     * @brief Shared FFmpeg context - enables safe concurrent access.
     */
    std::shared_ptr<FFmpegContext> m_context;

    /**
     * @brief Reader-writer lock for m_context: multiple readers OR single writer.
     */
    mutable std::shared_mutex m_context_mutex;

    /**
     * @brief Path to the currently open file.
     */
    std::string m_filepath;

    /**
     * @brief File read options used for this session.
     *
     * Default-initialized to NONE so the member never holds an indeterminate
     * value, matching the in-class initializer on m_audio_options.
     */
    FileReadOptions m_options = FileReadOptions::NONE;

    /**
     * @brief Audio-specific read options.
     */
    AudioReadOptions m_audio_options = AudioReadOptions::NONE;

    /**
     * @brief Last error message encountered.
     */
    mutable std::string m_last_error;

    /**
     * @brief Cached file metadata.
     */
    mutable std::optional<FileMetadata> m_cached_metadata;

    /**
     * @brief Cached file regions (markers, loops, etc.).
     */
    mutable std::vector<FileRegion> m_cached_regions;

    /**
     * @brief Current frame position for reading.
     */
    std::atomic<uint64_t> m_current_frame_position { 0 };

    /**
     * @brief Target sample rate for resampling (0 = use source rate).
     */
    uint32_t m_target_sample_rate = 0;

    /**
     * @brief Target bit depth (ignored, always outputs double).
     */
    uint32_t m_target_bit_depth = 0;

    /**
     * @brief Mutex for thread-safe metadata access.
     */
    mutable std::mutex m_metadata_mutex;

    // Simplified internal methods

    /**
     * @brief Set up the FFmpeg resampler if needed.
     * @param ctx FFmpeg context to configure.
     * @return True if setup succeeded.
     */
    bool setup_resampler(const std::shared_ptr<FFmpegContext>& ctx);

    /**
     * @brief Extract metadata from the file.
     * @param ctx FFmpeg context to read from.
     */
    void extract_metadata(const std::shared_ptr<FFmpegContext>& ctx);

    /**
     * @brief Extract region information from the file.
     * @param ctx FFmpeg context to read from.
     */
    void extract_regions(const std::shared_ptr<FFmpegContext>& ctx);

    /**
     * @brief Decode a specific number of frames from the file.
     * @param ctx FFmpeg context (taken by value, i.e. the callee holds its own reference).
     * @param num_frames Number of frames to decode.
     * @param offset Frame offset from beginning.
     * @return Vector of Kakshya::DataVariant containing the decoded data.
     */
    std::vector<Kakshya::DataVariant> decode_frames(
        std::shared_ptr<FFmpegContext> ctx,
        uint64_t num_frames,
        uint64_t offset);

    /**
     * @brief Internal seek implementation.
     * @param ctx FFmpeg context (non-const reference, unlike the other helpers).
     * @param frame_position Target frame position.
     * @return True if seek succeeded.
     */
    bool seek_internal(std::shared_ptr<FFmpegContext>& ctx, uint64_t frame_position);

    /**
     * @brief Convert interleaved audio data to deinterleaved (planar) format.
     * @param interleaved Input interleaved data.
     * @param channels Number of channels.
     * @return Deinterleaved data as std::vector<std::vector<double>>.
     */
    std::vector<std::vector<double>> deinterleave_data(const std::vector<double>& interleaved, uint32_t channels);

    /**
     * @brief Set the last error message.
     * @param error Error string.
     */
    void set_error(const std::string& error) const;

    /**
     * @brief Clear the last error message.
     */
    void clear_error() const;

    /**
     * @brief True if FFmpeg has been initialized.
     */
    static std::atomic<bool> s_ffmpeg_initialized;

    /**
     * @brief Mutex for FFmpeg initialization.
     */
    static std::mutex s_ffmpeg_init_mutex;
};


} // namespace MayaFlux::IO

FileReader.hpp

SoundFileContainer.hpp

MayaFlux::IO::FileReader
Abstract interface for reading various file formats into containers.
Definition FileReader.hpp:120

MayaFlux::IO::SoundFileReader::read_all
std::vector< Kakshya::DataVariant > read_all() override
Read the entire audio file into memory.
Definition SoundFileReader.cpp:500

MayaFlux::IO::SoundFileReader::close
void close() override
Close the currently open file and release resources.
Definition SoundFileReader.cpp:217

MayaFlux::IO::SoundFileReader::get_last_error
std::string get_last_error() const override
Get the last error message encountered by the reader.
Definition SoundFileReader.cpp:911

MayaFlux::IO::SoundFileReader::get_preferred_chunk_size
uint64_t get_preferred_chunk_size() const override
Get the preferred chunk size for streaming reads.
Definition SoundFileReader.cpp:871

MayaFlux::IO::SoundFileReader::m_target_sample_rate
uint32_t m_target_sample_rate
Target sample rate for resampling (0 = use source rate).
Definition SoundFileReader.hpp:317

MayaFlux::IO::SoundFileReader::supports_streaming
bool supports_streaming() const override
Check if the reader supports streaming access.
Definition SoundFileReader.cpp:917

MayaFlux::IO::SoundFileReader::open
bool open(const std::string &filepath, FileReadOptions options=FileReadOptions::ALL) override
Open an audio file for reading.
Definition SoundFileReader.cpp:130

MayaFlux::IO::SoundFileReader::load_into_container
bool load_into_container(std::shared_ptr< Kakshya::SignalSourceContainer > container) override
Load file data into an existing SignalSourceContainer.
Definition SoundFileReader.cpp:815

MayaFlux::IO::SoundFileReader::m_context_mutex
std::shared_mutex m_context_mutex
Definition SoundFileReader.hpp:277

MayaFlux::IO::SoundFileReader::can_read
bool can_read(const std::string &filepath) const override
Check if this reader can open the given file.
Definition SoundFileReader.cpp:111

MayaFlux::IO::SoundFileReader::m_target_bit_depth
uint32_t m_target_bit_depth
Target bit depth (ignored, always outputs double).
Definition SoundFileReader.hpp:322

MayaFlux::IO::SoundFileReader::m_metadata_mutex
std::mutex m_metadata_mutex
Mutex for thread-safe metadata access.
Definition SoundFileReader.hpp:327

MayaFlux::IO::SoundFileReader::s_ffmpeg_initialized
static std::atomic< bool > s_ffmpeg_initialized
True if FFmpeg has been initialized.
Definition SoundFileReader.hpp:389

MayaFlux::IO::SoundFileReader::decode_frames
std::vector< Kakshya::DataVariant > decode_frames(std::shared_ptr< FFmpegContext > ctx, uint64_t num_frames, uint64_t offset)
Decode a specific number of frames from the file.
Definition SoundFileReader.cpp:554

MayaFlux::IO::SoundFileReader::seek_internal
bool seek_internal(std::shared_ptr< FFmpegContext > &ctx, uint64_t frame_position)
Internal seek implementation.
Definition SoundFileReader.cpp:730

MayaFlux::IO::SoundFileReader::m_last_error
std::string m_last_error
Last error message encountered.
Definition SoundFileReader.hpp:297

MayaFlux::IO::SoundFileReader::extract_regions
void extract_regions(const std::shared_ptr< FFmpegContext > &ctx)
Extract region information from the file.
Definition SoundFileReader.cpp:397

MayaFlux::IO::SoundFileReader::get_read_position
std::vector< uint64_t > get_read_position() const override
Get the current read position in the file.
Definition SoundFileReader.cpp:708

MayaFlux::IO::SoundFileReader::set_error
void set_error(const std::string &error) const
Set the last error message.
Definition SoundFileReader.cpp:928

MayaFlux::IO::SoundFileReader::m_current_frame_position
std::atomic< uint64_t > m_current_frame_position
Current frame position for reading.
Definition SoundFileReader.hpp:312

MayaFlux::IO::SoundFileReader::extract_metadata
void extract_metadata(const std::shared_ptr< FFmpegContext > &ctx)
Extract metadata from the file.
Definition SoundFileReader.cpp:345

MayaFlux::IO::SoundFileReader::get_container_type
std::type_index get_container_type() const override
Get the C++ type of the container returned by this reader.
Definition SoundFileReader.hpp:206

MayaFlux::IO::SoundFileReader::setup_resampler
bool setup_resampler(const std::shared_ptr< FFmpegContext > &ctx)
Set up the FFmpeg resampler if needed.
Definition SoundFileReader.cpp:240

MayaFlux::IO::SoundFileReader::read_region
std::vector< Kakshya::DataVariant > read_region(const FileRegion &region) override
Read a specific region from the file.
Definition SoundFileReader.cpp:690

MayaFlux::IO::SoundFileReader::read_frames
std::vector< Kakshya::DataVariant > read_frames(uint64_t num_frames, uint64_t offset=0)
Read a specific number of frames from the file.
Definition SoundFileReader.cpp:515

MayaFlux::IO::SoundFileReader::m_audio_options
AudioReadOptions m_audio_options
Audio-specific read options.
Definition SoundFileReader.hpp:292

MayaFlux::IO::SoundFileReader::m_context
std::shared_ptr< FFmpegContext > m_context
Definition SoundFileReader.hpp:274

MayaFlux::IO::SoundFileReader::m_cached_metadata
std::optional< FileMetadata > m_cached_metadata
Cached file metadata.
Definition SoundFileReader.hpp:302

MayaFlux::IO::SoundFileReader::m_cached_regions
std::vector< FileRegion > m_cached_regions
Cached file regions (markers, loops, etc.).
Definition SoundFileReader.hpp:307

MayaFlux::IO::SoundFileReader::clear_error
void clear_error() const
Clear the last error message.
Definition SoundFileReader.cpp:934

MayaFlux::IO::SoundFileReader::~SoundFileReader
~SoundFileReader() override
Destroy the SoundFileReader object.
Definition SoundFileReader.cpp:94

MayaFlux::IO::SoundFileReader::get_data_type
std::type_index get_data_type() const override
Get the C++ type of the data returned by this reader.
Definition SoundFileReader.hpp:200

MayaFlux::IO::SoundFileReader::m_filepath
std::string m_filepath
Path to the currently open file.
Definition SoundFileReader.hpp:282

MayaFlux::IO::SoundFileReader::get_dimension_sizes
std::vector< uint64_t > get_dimension_sizes() const override
Get the size of each dimension (e.g., frames, channels).
Definition SoundFileReader.cpp:888

MayaFlux::IO::SoundFileReader::set_target_bit_depth
void set_target_bit_depth(uint32_t bit_depth)
Set the target bit depth (ignored, always outputs double).
Definition SoundFileReader.hpp:263

MayaFlux::IO::SoundFileReader::set_audio_options
void set_audio_options(AudioReadOptions options)
Set audio-specific read options.
Definition SoundFileReader.hpp:250

MayaFlux::IO::SoundFileReader::create_container
std::shared_ptr< Kakshya::SignalSourceContainer > create_container() override
Create a SignalSourceContainer for this file.
Definition SoundFileReader.cpp:796

MayaFlux::IO::SoundFileReader::seek
bool seek(const std::vector< uint64_t > &position) override
Seek to a specific position in the file.
Definition SoundFileReader.cpp:713

MayaFlux::IO::SoundFileReader::SoundFileReader
SoundFileReader()
Construct a new SoundFileReader object.
Definition SoundFileReader.cpp:89

MayaFlux::IO::SoundFileReader::deinterleave_data
std::vector< std::vector< double > > deinterleave_data(const std::vector< double > &interleaved, uint32_t channels)
Convert interleaved audio data to deinterleaved (planar) format.
Definition SoundFileReader.cpp:940

MayaFlux::IO::SoundFileReader::get_num_dimensions
size_t get_num_dimensions() const override
Get the number of dimensions in the audio data (typically 2: time, channel).
Definition SoundFileReader.cpp:883

MayaFlux::IO::SoundFileReader::get_metadata
std::optional< FileMetadata > get_metadata() const override
Get metadata for the currently open file.
Definition SoundFileReader.cpp:280

MayaFlux::IO::SoundFileReader::get_regions
std::vector< FileRegion > get_regions() const override
Get all regions (markers, loops, etc.) from the file.
Definition SoundFileReader.cpp:484

MayaFlux::IO::SoundFileReader::is_open
bool is_open() const override
Check if a file is currently open.
Definition SoundFileReader.cpp:230

MayaFlux::IO::SoundFileReader::m_options
FileReadOptions m_options
File read options used for this session.
Definition SoundFileReader.hpp:287

MayaFlux::IO::SoundFileReader::get_supported_extensions
std::vector< std::string > get_supported_extensions() const override
Get supported file extensions for this reader.
Definition SoundFileReader.cpp:899

MayaFlux::IO::SoundFileReader::initialize_ffmpeg
static void initialize_ffmpeg()
Initialize FFmpeg libraries (thread-safe, called automatically).
Definition SoundFileReader.cpp:99

MayaFlux::IO::SoundFileReader::set_target_sample_rate
void set_target_sample_rate(uint32_t sample_rate)
Set the target sample rate for resampling.
Definition SoundFileReader.hpp:256

MayaFlux::IO::SoundFileReader::s_ffmpeg_init_mutex
static std::mutex s_ffmpeg_init_mutex
Mutex for FFmpeg initialization.
Definition SoundFileReader.hpp:394

MayaFlux::IO::SoundFileReader
FFmpeg-based audio file reader for MayaFlux.
Definition SoundFileReader.hpp:99

MayaFlux::Kakshya::SoundFileContainer
File-backed audio container with complete streaming functionality.
Definition SoundFileContainer.hpp:27

MayaFlux::IO::AudioReadOptions
AudioReadOptions
Audio-specific reading options.
Definition SoundFileReader.hpp:21

MayaFlux::IO::AudioReadOptions::CONVERT_TO_MONO
@ CONVERT_TO_MONO

MayaFlux::IO::AudioReadOptions::NORMALIZE
@ NORMALIZE

MayaFlux::IO::AudioReadOptions::DEINTERLEAVE
@ DEINTERLEAVE

MayaFlux::IO::AudioReadOptions::NONE
@ NONE

MayaFlux::IO::FileReadOptions
FileReadOptions
Generic options for file reading behavior.
Definition FileReader.hpp:60

MayaFlux::IO::FileReadOptions::ALL
@ ALL
All options enabled.

MayaFlux::IO::FileReadOptions::NONE
@ NONE
No special options.

MayaFlux::IO::operator&
FileReadOptions operator&(FileReadOptions a, FileReadOptions b)
Definition FileReader.hpp:78

MayaFlux::IO::operator|
FileReadOptions operator|(FileReadOptions a, FileReadOptions b)
Definition FileReader.hpp:73

MayaFlux::IO
Definition Depot.hpp:14

MayaFlux::IO::FFmpegContext::operator=
FFmpegContext & operator=(const FFmpegContext &)=delete

MayaFlux::IO::FFmpegContext::channels
uint32_t channels
Definition SoundFileReader.hpp:52

MayaFlux::IO::FFmpegContext::audio_stream_index
int audio_stream_index
Definition SoundFileReader.hpp:49

MayaFlux::IO::FFmpegContext::swr_context
SwrContext * swr_context
Definition SoundFileReader.hpp:48

MayaFlux::IO::FFmpegContext::operator=
FFmpegContext & operator=(FFmpegContext &&)=delete

MayaFlux::IO::FFmpegContext::FFmpegContext
FFmpegContext(const FFmpegContext &)=delete

MayaFlux::IO::FFmpegContext::FFmpegContext
FFmpegContext()=default

MayaFlux::IO::FFmpegContext::FFmpegContext
FFmpegContext(FFmpegContext &&)=delete

MayaFlux::IO::FFmpegContext::codec_context
AVCodecContext * codec_context
Definition SoundFileReader.hpp:47

MayaFlux::IO::FFmpegContext::format_context
AVFormatContext * format_context
Definition SoundFileReader.hpp:46

MayaFlux::IO::FFmpegContext::~FFmpegContext
~FFmpegContext()
Definition SoundFileReader.cpp:20

MayaFlux::IO::FFmpegContext::total_frames
uint64_t total_frames
Definition SoundFileReader.hpp:50

MayaFlux::IO::FFmpegContext::is_valid
bool is_valid() const
Definition SoundFileReader.hpp:63

MayaFlux::IO::FFmpegContext::sample_rate
uint32_t sample_rate
Definition SoundFileReader.hpp:51

MayaFlux::IO::FFmpegContext
RAII wrapper for FFmpeg contexts with proper cleanup.
Definition SoundFileReader.hpp:45

MayaFlux::IO::FileRegion
Generic region descriptor for any file type.
Definition FileReader.hpp:90