libpromeki/audioformat_8h_source.html

#pragma once


#include <promeki/config.h>

#if PROMEKI_ENABLE_PROAV

#include <cmath>
#include <cstddef>
#include <cstdint>
#include <cstring>
#include <limits>
#include <type_traits>

#include <promeki/namespace.h>

#include <promeki/string.h>

#include <promeki/list.h>

#include <promeki/fourcc.h>

#include <promeki/audiocodec.h>

#include <promeki/result.h>

#include <promeki/system.h>

#include <promeki/datatype.h>


PROMEKI_NAMESPACE_BEGIN


class DataStream;


/**
 * @brief Value-type handle that identifies an audio sample format.
 *
 * An AudioFormat stores a single pointer to a @ref Data record resolved by
 * lookupData() at construction.  Two handles compare equal when they point
 * at the same record.
 *
 * Every accessor is safe to call on a handle whose record pointer is null
 * (see isValid()): it then reports the values of a default-constructed
 * @ref Data record (id == Invalid, empty strings, zero sizes, no
 * conversion callbacks) instead of dereferencing a null pointer.
 */
class AudioFormat {
        public:
                // DataType glue for this class; the macro comes from
                // promeki/datatype.h and its expansion is not visible here.
                PROMEKI_DATATYPE(AudioFormat, DataTypeAudioFormat, 1)

                /// Writes this format to @p s (implemented out of line).
                Error writeToStream(DataStream &s) const;

                /// Reads a format from @p s (implemented out of line).
                /// @tparam V presumably the serialized version to decode — confirm against the definition.
                template <uint32_t V> static Result<AudioFormat> readFromStream(DataStream &s);

                /// Smallest value of a signed 24-bit sample.
                static constexpr int32_t MinS24 = -8388608;
                /// Largest value of a signed 24-bit sample.
                static constexpr int32_t MaxS24 = 8388607;
                /// Smallest value of an unsigned 24-bit sample.
                static constexpr int32_t MinU24 = 0;
                /// Largest value of an unsigned 24-bit sample.
                static constexpr int32_t MaxU24 = 16777215;

                /// Identifiers of the built-in formats.  Values at or above
                /// UserDefined are left for user-registered formats.
                enum ID {
                        Invalid = 0,

                        // -- Interleaved PCM -------------------------------
                        PCMI_Float32LE = 1,
                        PCMI_Float32BE = 2,
                        PCMI_S8 = 3,
                        PCMI_U8 = 4,
                        PCMI_S16LE = 5,
                        PCMI_U16LE = 6,
                        PCMI_S16BE = 7,
                        PCMI_U16BE = 8,
                        PCMI_S24LE = 9,
                        PCMI_U24LE = 10,
                        PCMI_S24BE = 11,
                        PCMI_U24BE = 12,
                        PCMI_S32LE = 13,
                        PCMI_U32LE = 14,
                        PCMI_S32BE = 15,
                        PCMI_U32BE = 16,
                        // 24-bit data carried in a 32-bit container.  HB32 = data
                        // occupies the high 3 bytes of the word (low byte is 0);
                        // LB32 = data occupies the low 3 bytes (high byte is 0).
                        // Endianness applies to the 32-bit word as a whole, not
                        // the 24-bit data subset.
                        PCMI_S24LE_HB32 = 17,
                        PCMI_S24LE_LB32 = 18,
                        PCMI_S24BE_HB32 = 19,
                        PCMI_S24BE_LB32 = 20,
                        PCMI_U24LE_HB32 = 21,
                        PCMI_U24LE_LB32 = 22,
                        PCMI_U24BE_HB32 = 23,
                        PCMI_U24BE_LB32 = 24,

                        // -- Planar PCM ------------------------------------
                        PCMP_Float32LE = 32,
                        PCMP_Float32BE = 33,
                        PCMP_S8 = 34,
                        PCMP_U8 = 35,
                        PCMP_S16LE = 36,
                        PCMP_U16LE = 37,
                        PCMP_S16BE = 38,
                        PCMP_U16BE = 39,
                        PCMP_S24LE = 40,
                        PCMP_U24LE = 41,
                        PCMP_S24BE = 42,
                        PCMP_U24BE = 43,
                        PCMP_S32LE = 44,
                        PCMP_U32LE = 45,
                        PCMP_S32BE = 46,
                        PCMP_U32BE = 47,
                        // Planar 24-bit-in-32-bit container variants, mirroring
                        // the interleaved set above.
                        PCMP_S24LE_HB32 = 48,
                        PCMP_S24LE_LB32 = 49,
                        PCMP_S24BE_HB32 = 50,
                        PCMP_S24BE_LB32 = 51,
                        PCMP_U24LE_HB32 = 52,
                        PCMP_U24LE_LB32 = 53,
                        PCMP_U24BE_HB32 = 54,
                        PCMP_U24BE_LB32 = 55,

                        // -- Compressed ------------------------------------
                        Opus = 64,
                        AAC = 65,
                        FLAC = 66,
                        MP3 = 67,
                        AC3 = 68,

                        UserDefined = 1024
                };

                /// List of format identifiers.
                using IDList = ::promeki::List<ID>;

                /// Interleaved 32-bit float format matching the host byte order.
                static constexpr ID NativeFloat = System::isLittleEndian() ? PCMI_Float32LE : PCMI_Float32BE;

                /// Descriptor record behind a format handle.  Every field has
                /// a default, so a default-constructed record describes the
                /// Invalid format.
                struct Data {
                                ID           id = Invalid;           ///< Format identifier.
                                String       name;                   ///< Name, also returned by toString().
                                String       desc;                   ///< Description text.
                                size_t       bytesPerSample = 0;     ///< Bytes per sample.
                                size_t       bitsPerSample = 0;      ///< Bits per sample.
                                bool         isSigned = false;       ///< Samples are signed.
                                bool         isFloat = false;        ///< Samples are floating point.
                                bool         isPlanar = false;       ///< Planar (vs. interleaved) layout.
                                bool         isBigEndian = false;    ///< Samples are big-endian.
                                bool         compressed = false;     ///< Compressed (non-PCM) format.
                                AudioCodec   audioCodec;             ///< Associated codec.
                                FourCC::List fourccList;             ///< FourCC codes associated with the format.
                                /// Optional callback converting @p samples raw samples at @p in to floats at @p out.
                                void (*samplesToFloat)(float *out, const uint8_t *in, size_t samples) = nullptr;
                                /// Optional callback converting @p samples floats at @p in to raw samples at @p out.
                                void (*floatToSamples)(uint8_t *out, const float *in, size_t samples) = nullptr;
                };

                /// Returns an ID for a new user format (implemented out of line;
                /// presumably at or above UserDefined — confirm).
                static ID registerType();

                /// Registers the descriptor @p data (implemented out of line).
                static void registerData(Data &&data);

                /// Returns the registered format IDs (implemented out of line).
                static IDList registeredIDs();

                /// Resolves a format from @p name (implemented out of line).
                static Result<AudioFormat> lookup(const String &name);

                /// Builds a format from the string @p name (implemented out of
                /// line; how it differs from lookup() is not visible here).
                static Result<AudioFormat> fromString(const String &name);

                /// Resolves a format from the FourCC @p fcc (implemented out of line).
                static AudioFormat lookupByFourCC(const FourCC &fcc);

                /// Builds a handle for @p id; defaults to the Invalid format.
                inline AudioFormat(ID id = Invalid);

                /// True when the handle has a record whose id is not Invalid.
                bool isValid() const { return d != nullptr && d->id != Invalid; }

                /// Format identifier (Invalid for a null-backed handle).
                ID id() const { return record().id; }

                /// Format name (empty for a null-backed handle).
                const String &name() const { return record().name; }

                /// Format description (empty for a null-backed handle).
                const String &desc() const { return record().desc; }

                /// Bytes per sample (0 for a null-backed handle).
                size_t bytesPerSample() const { return record().bytesPerSample; }

                /// Bits per sample (0 for a null-backed handle).
                size_t bitsPerSample() const { return record().bitsPerSample; }

                /// Whether samples are signed.
                bool isSigned() const { return record().isSigned; }

                /// Whether samples are floating point.
                bool isFloat() const { return record().isFloat; }

                /// Whether the layout is planar.
                bool isPlanar() const { return record().isPlanar; }

                /// Whether samples are big-endian.
                bool isBigEndian() const { return record().isBigEndian; }

                /// Whether the format is compressed.
                bool isCompressed() const { return record().compressed; }

                /// Codec associated with the format.
                const AudioCodec &audioCodec() const { return record().audioCodec; }

                /// FourCC codes associated with the format.
                const FourCC::List &fourccList() const { return record().fourccList; }

                /// Converts @p samples raw samples at @p in to floats at @p out
                /// through the record's callback.  Does nothing when the format
                /// has no such callback.
                void samplesToFloat(float *out, const uint8_t *in, size_t samples) const {
                        const Data &rec = record();
                        if (rec.samplesToFloat != nullptr) rec.samplesToFloat(out, in, samples);
                }

                /// Converts @p samples floats at @p in to raw samples at @p out
                /// through the record's callback.  Does nothing when the format
                /// has no such callback.
                void floatToSamples(uint8_t *out, const float *in, size_t samples) const {
                        const Data &rec = record();
                        if (rec.floatToSamples != nullptr) rec.floatToSamples(out, in, samples);
                }

                // -- Direct (no-float) format-to-format conversion --------
                //
                // The library tracks a per-(src,dst) registry of "direct"
                // converters that bypass the via-float intermediate step.
                // Direct converters are faster (one memory pass) and
                // additionally permit @ref isBitAccurateTo, which matters
                // when audio buffers carry non-PCM payloads (SMPTE 337M
                // data bursts, AES3 user bits, ...) -- those bytes survive
                // a direct integer-to-integer transform but are scrambled
                // by an int -> float -> int round-trip.

                /// Signature of a direct converter: @p samples samples from @p in to @p out.
                using DirectConvertFn = void (*)(void *out, const void *in, size_t samples);

                /// Returns the direct converter registered for (@p src, @p dst);
                /// callers in this class treat nullptr as "none".
                static DirectConvertFn directConverter(ID src, ID dst);

                /// Whether the (@p src, @p dst) conversion is bit accurate (implemented out of line).
                static bool isBitAccurate(ID src, ID dst);

                /// Registers @p fn as the direct converter for (@p src, @p dst)
                /// with the given @p bitAccurate flag (implemented out of line).
                static void registerDirectConverter(ID src, ID dst, DirectConvertFn fn, bool bitAccurate);

                /// True when a direct converter from this format to @p dst exists.
                bool hasDirectConverterTo(const AudioFormat &dst) const {
                        return directConverter(id(), dst.id()) != nullptr;
                }

                /// True when converting from this format to @p dst is bit accurate.
                bool isBitAccurateTo(const AudioFormat &dst) const { return isBitAccurate(id(), dst.id()); }

                /// Converts @p samples samples at @p in (this format) to @p out
                /// (format @p dst).  Implemented out of line; @p scratch is an
                /// optional float work buffer — presumably used by the via-float
                /// path, confirm sizing requirements against the definition.
                Error convertTo(const AudioFormat &dst, void *out, const void *in, size_t samples,
                                float *scratch = nullptr) const;

                /// Multi-channel overload taking @p samplesPerChannel and
                /// @p channels (implemented out of line).
                Error convertTo(const AudioFormat &dst, void *out, const void *in, size_t samplesPerChannel,
                                size_t channels, float *scratch = nullptr) const;

                /// Equal when both handles point at the same record.
                bool operator==(const AudioFormat &o) const { return d == o.d; }

                /// Negation of operator==.
                bool operator!=(const AudioFormat &o) const { return d != o.d; }

                /// String form of the format: its name.
                const String &toString() const { return record().name; }

                /// Raw record pointer; may be null for a handle without a record.
                const Data *data() const { return d; }

                // -- Integer <-> normalized float conversion helpers -------
                // These are used by the registered PCM formats' sample
                // conversion functions and are exposed as static utilities
                // so user-registered formats can reuse them.

                /**
                 * @brief Maps an integer sample in [Min, Max] to a normalized float.
                 * @tparam IntegerType integral sample type.
                 * @tparam Min         lowest sample value.
                 * @tparam Max         highest sample value.
                 * @param value sample to convert.
                 * @return value / max(|Min|, Max) when Min is negative, otherwise
                 *         a linear map of [Min, Max] onto [-1, 1].
                 */
                template <typename IntegerType, IntegerType Min, IntegerType Max>
                static float integerToFloat(IntegerType value) {
                        static_assert(std::is_integral<IntegerType>::value, "IntegerType must be an integer.");
                        if constexpr (Min < 0) {
                                // Signed range: divide by max(|Min|, Max) so an
                                // integer 0 maps to exactly 0.0f.  Standard audio
                                // convention; preserves silence through int<->float
                                // round-trips, which the linear-interp asymmetric
                                // mapping does not (it pushes 0 to ~1/(Max-Min)
                                // and that DC bias derails sync detectors that
                                // expect zero-mean silence between codewords).
                                constexpr float scaleNeg = -static_cast<float>(Min);
                                constexpr float scalePos = static_cast<float>(Max);
                                constexpr float scale = scaleNeg > scalePos ? scaleNeg : scalePos;
                                return static_cast<float>(value) / scale;
                        } else {
                                constexpr float min = static_cast<float>(Min);
                                constexpr float max = static_cast<float>(Max);
                                return ((static_cast<float>(value) - min) * 2.0f / (max - min)) - 1.0f;
                        }
                }

                /// Same as the three-parameter form, using the full range of @p IntegerType.
                template <typename IntegerType> static float integerToFloat(IntegerType value) {
                        static_assert(std::is_integral<IntegerType>::value, "IntegerType must be an integer.");
                        return integerToFloat<IntegerType, std::numeric_limits<IntegerType>::min(),
                                              std::numeric_limits<IntegerType>::max()>(value);
                }

                /**
                 * @brief Maps a normalized float to an integer sample in [Min, Max].
                 *
                 * Inputs at or below -1.0f yield Min and inputs at or above 1.0f
                 * yield Max.  NaN is treated as 0.0f (silence).  The scaled value
                 * is clamped to [Min, Max] before the float-to-integer cast, so
                 * the cast never sees an unrepresentable value.
                 *
                 * @tparam IntegerType integral sample type.
                 * @tparam Min         lowest sample value.
                 * @tparam Max         highest sample value.
                 * @param value normalized input.
                 * @return the converted sample, truncated toward zero.
                 */
                template <typename IntegerType, IntegerType Min, IntegerType Max>
                static IntegerType floatToInteger(float value) {
                        static_assert(std::is_integral<IntegerType>::value, "IntegerType must be an integer.");
                        // NaN fails both range guards below and converting it to
                        // an integer is undefined behaviour, so map it to silence.
                        if (std::isnan(value)) value = 0.0f;
                        if (value <= -1.0f) return Min;
                        if (value >= 1.0f) return Max;
                        constexpr float lo = static_cast<float>(Min);
                        constexpr float hi = static_cast<float>(Max);
                        float scaled = 0.0f;
                        if constexpr (Min < 0) {
                                // Symmetric inverse of integerToFloat: scale by
                                // max(|Min|, Max) so 0.0f maps to 0 exactly and
                                // float->int->float round-trips zero without bias.
                                constexpr float scale = -lo > hi ? -lo : hi;
                                scaled = value * scale;
                        } else {
                                scaled = (value + 1.0f) * 0.5f * (hi - lo) + lo;
                        }
                        // static_cast<float>(Max) can round above Max (e.g. 2^32 for
                        // uint32_t) and float rounding can land exactly on it;
                        // clamp so the cast below stays within IntegerType's range.
                        if (scaled >= hi) return Max;
                        if (scaled <= lo) return Min;
                        return static_cast<IntegerType>(scaled);
                }

                /// Same as the three-parameter form, using the full range of @p IntegerType.
                template <typename IntegerType> static IntegerType floatToInteger(float value) {
                        static_assert(std::is_integral<IntegerType>::value, "IntegerType must be an integer.");
                        return floatToInteger<IntegerType, std::numeric_limits<IntegerType>::min(),
                                              std::numeric_limits<IntegerType>::max()>(value);
                }

                /**
                 * @brief Converts packed integer samples to normalized floats.
                 * @tparam IntegerType      integral sample type stored in @p inbuf.
                 * @tparam InputIsBigEndian byte order of the stored samples.
                 * @param out     destination for @p samples floats.
                 * @param inbuf   source bytes; no alignment is required.
                 * @param samples number of samples to convert.
                 */
                template <typename IntegerType, bool InputIsBigEndian>
                static void samplesToFloatImpl(float *out, const uint8_t *inbuf, size_t samples) {
                        static_assert(std::is_integral<IntegerType>::value, "IntegerType must be an integer.");
                        for (size_t i = 0; i < samples; ++i) {
                                // memcpy instead of a reinterpret_cast load: the byte
                                // buffer carries no alignment guarantee for IntegerType.
                                IntegerType val;
                                std::memcpy(&val, inbuf + i * sizeof(IntegerType), sizeof(IntegerType));
                                if constexpr (InputIsBigEndian != System::isBigEndian()) System::swapEndian(val);
                                out[i] = integerToFloat<IntegerType>(val);
                        }
                }

                /**
                 * @brief Converts normalized floats to packed integer samples.
                 * @tparam IntegerType       integral sample type written to @p outbuf.
                 * @tparam OutputIsBigEndian byte order of the stored samples.
                 * @param outbuf  destination bytes; no alignment is required.
                 * @param in      source of @p samples floats.
                 * @param samples number of samples to convert.
                 */
                template <typename IntegerType, bool OutputIsBigEndian>
                static void floatToSamplesImpl(uint8_t *outbuf, const float *in, size_t samples) {
                        static_assert(std::is_integral<IntegerType>::value, "IntegerType must be an integer.");
                        for (size_t i = 0; i < samples; ++i) {
                                IntegerType val = floatToInteger<IntegerType>(in[i]);
                                if constexpr (OutputIsBigEndian != System::isBigEndian()) System::swapEndian(val);
                                // memcpy instead of a reinterpret_cast store: the byte
                                // buffer carries no alignment guarantee for IntegerType.
                                std::memcpy(outbuf + i * sizeof(IntegerType), &val, sizeof(IntegerType));
                        }
                }

        private:
                const Data        *d = nullptr;
                static const Data *lookupData(ID id);

                /// Default-constructed record reported by accessors when d is null.
                static const Data &invalidData() {
                        static const Data fallback = Data();
                        return fallback;
                }

                /// The record behind this handle, or invalidData() when d is null.
                const Data &record() const { return d != nullptr ? *d : invalidData(); }
};


inline AudioFormat::AudioFormat(ID id) : d(lookupData(id)) {}


PROMEKI_NAMESPACE_END


#endif // PROMEKI_ENABLE_PROAV

audiocodec.h

datatype.h

fourcc.h

list.h

namespace.h

result.h

string.h

system.h