src/AudioWaveformer.cpp

/**
 * @file
 * @brief Source file for AudioWaveformer class
 * @author Jonathan Thomas <jonathan@openshot.org>
 *
 * @ref License
 */

// Copyright (c) 2008-2022 OpenShot Studios, LLC
//
// SPDX-License-Identifier: LGPL-3.0-or-later

#include "AudioWaveformer.h"

#include <vector>


using namespace std;
using namespace openshot;


// Default constructor
AudioWaveformer::AudioWaveformer(ReaderBase* new_reader) : reader(new_reader)
{

}

// Destructor: no explicit cleanup is performed here
AudioWaveformer::~AudioWaveformer() = default;

/**
 * @brief Extract a reduced ("waveform") sample set from the attached reader.
 *
 * Every frame from 1 to reader->info.video_length is requested, and its audio
 * samples are grouped into consecutive chunks of
 * (sample_rate / num_per_second) samples. For each completed chunk two values
 * are stored:
 *   - max_samples[i]: the largest absolute sample value seen in the chunk
 *   - rms_samples[i]: the mean absolute sample value of the chunk, averaged
 *                     over the chunk length and the number of channels used
 * A trailing chunk that never reaches the full chunk length is not emitted.
 *
 * The output buffers are sized to num_per_second * (duration + 1) entries and
 * zeroed before use; chunks that would not fit into that size are dropped.
 * While extracting, reader->info.has_video is set to false and put back to
 * its earlier value afterwards (also when an exception propagates).
 *
 * @param channel         Channel index to read, or -1 to combine all channels.
 *                        An index outside the reader's channels yields zeros.
 * @param num_per_second  Number of output values per second of audio. Values
 *                        <= 0 return an empty AudioWaveformData.
 * @param normalize       When true (and the audio is not completely silent),
 *                        scale the result by 1 / (largest chunk maximum).
 * @return The extracted waveform data (default-constructed when there is no
 *         reader or num_per_second is not positive).
 */
AudioWaveformData AudioWaveformer::ExtractSamples(int channel, int num_per_second, bool normalize) {
    AudioWaveformData data;

    // Nothing to extract without a reader; a non-positive rate would divide by zero below
    if (!reader || num_per_second <= 0) {
        return data;
    }

    // Open reader (if needed)
    bool does_reader_have_video = reader->info.has_video;
    if (!reader->IsOpen()) {
        reader->Open();
    }
    // Disable video for faster processing
    reader->info.has_video = false;

    try {
        const int sample_rate = reader->info.sample_rate;
        // Clamp to 1 so a rate above the sample rate (or a reader reporting a
        // sample rate of 0) cannot produce a zero-length chunk
        const int sample_divisor = std::max(1, sample_rate / num_per_second);
        const int total_samples = std::max(0, static_cast<int>(num_per_second * (reader->info.duration + 1.0)));
        int extracted_index = 0;

        // Resize and clear audio buffers
        data.resize(total_samples);
        data.zero(total_samples);

        // Running state of the chunk currently being accumulated
        int sample_index = 0;
        float samples_max = 0.0;
        float chunk_max = 0.0;
        float chunk_sum = 0.0;

        // Which channels are we using: [first_channel, last_channel)
        const int reader_channels = reader->info.channels;
        int first_channel = 0;
        int last_channel = reader_channels;
        int channel_count = reader_channels;
        if (channel != -1) {
            channel_count = 1;
            const bool channel_exists = (channel >= 0 && channel < reader_channels);
            first_channel = channel_exists ? channel : 0;
            last_channel = channel_exists ? channel + 1 : 0;
        }

        // Per-frame cache of channel buffers, indexed by the real channel index
        // (sized for every reader channel so a single high channel index fits)
        std::vector<float*> channels(std::max(0, reader_channels), nullptr);

        // Divisor used to average a completed chunk
        const float chunk_divisor = static_cast<float>(sample_divisor * channel_count);

        // Loop through all frames (stop early once the output buffers are full)
        for (auto f = 1; f <= reader->info.video_length && extracted_index < total_samples; f++) {
            // Get next frame
            shared_ptr<openshot::Frame> frame = reader->GetFrame(f);

            // Cache channels for this frame, to reduce # of calls to frame->GetAudioSamples
            for (int channel_index = first_channel; channel_index < last_channel; channel_index++) {
                channels[channel_index] = frame->GetAudioSamples(channel_index);
            }

            // Get sample value from a specific channel (or all channels)
            const int frame_sample_count = frame->GetAudioSamplesCount();
            for (int s = 0; s < frame_sample_count && extracted_index < total_samples; s++) {
                for (int channel_index = first_channel; channel_index < last_channel; channel_index++) {
                    const float sample = channels[channel_index][s];
                    // sqrt(x * x) is the absolute value of the sample
                    const float magnitude = std::sqrt(sample * sample);

                    // Accumulate sample averages
                    chunk_sum += magnitude;
                    chunk_max = std::max(chunk_max, magnitude);
                }

                sample_index += 1;

                // Cut-off reached: emit one output value for this chunk
                if (sample_index == sample_divisor) {
                    data.max_samples[extracted_index] = chunk_max;
                    data.rms_samples[extracted_index] = (chunk_divisor > 0.0f) ? (chunk_sum / chunk_divisor) : 0.0f;
                    extracted_index++;

                    // Track the overall maximum (used for normalization)
                    samples_max = std::max(samples_max, chunk_max);

                    // Reset chunk state
                    sample_index = 0;
                    chunk_max = 0.0;
                    chunk_sum = 0.0;
                }
            }
        }

        // Scale all values relative to the largest chunk maximum (regardless of how
        // small or how large the original audio sample values are). Skipped for
        // completely silent audio, where the scale factor would be 1 / 0.
        if (normalize && samples_max > 0.0f) {
            data.scale(total_samples, 1.0f / samples_max);
        }
    } catch (...) {
        // Do not leave video disabled on the reader when extraction fails
        reader->info.has_video = does_reader_have_video;
        throw;
    }

    // Resume previous has_video value
    reader->info.has_video = does_reader_have_video;

    return data;
}
Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00			`/**`
			`* @file`
			`* @brief Source file for AudioWaveformer class`
			`* @author Jonathan Thomas <jonathan@openshot.org>`
			`*`
			`* @ref License`
			`*/`

			`// Copyright (c) 2008-2022 OpenShot Studios, LLC`
			`//`
			`// SPDX-License-Identifier: LGPL-3.0-or-later`

			`#include "AudioWaveformer.h"`


			`using namespace std;`
			`using namespace openshot;`


			`// Default constructor`
			`AudioWaveformer::AudioWaveformer(ReaderBase* new_reader) : reader(new_reader)`
			`{`

			`}`

			`// Destructor`
			`AudioWaveformer::~AudioWaveformer()`
			`{`

			`}`

			`// Extract audio samples from any ReaderBase class`
Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00			`AudioWaveformData AudioWaveformer::ExtractSamples(int channel, int num_per_second, bool normalize) {`
			`AudioWaveformData data;`
Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00
			`if (reader) {`
			`// Open reader (if needed)`
			`bool does_reader_have_video = reader->info.has_video;`
			`if (!reader->IsOpen()) {`
			`reader->Open();`
			`}`
			`// Disable video for faster processing`
			`reader->info.has_video = false;`

			`int sample_rate = reader->info.sample_rate;`
			`int sample_divisor = sample_rate / num_per_second;`
			`int total_samples = num_per_second * (reader->info.duration + 1.0);`
			`int extracted_index = 0;`

Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00			`// Resize and clear audio buffers`
			`data.resize(total_samples);`
			`data.zero(total_samples);`
Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00
			`// Loop through all frames`
			`int sample_index = 0;`
			`float samples_max = 0.0;`
Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00			`float chunk_max = 0.0;`
			`float chunk_squared_sum = 0.0;`

			`// How many channels are we using`
			`int channel_count = 1;`
			`if (channel == -1) {`
			`channel_count = reader->info.channels;`
			`}`
Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00
			`for (auto f = 1; f <= reader->info.video_length; f++) {`
			`// Get next frame`
			`shared_ptr<openshot::Frame> frame = reader->GetFrame(f);`

Some performance optimizations. to reduce # of calls to GetAudioSamples() 2022-11-01 16:48:37 -05:00			`// Cache channels for this frame, to reduce # of calls to frame->GetAudioSamples`
			`float* channels[channel_count];`
			`for (auto channel_index = 0; channel_index < reader->info.channels; channel_index++) {`
			`if (channel == channel_index \|\| channel == -1) {`
			`channels[channel_index] = frame->GetAudioSamples(channel_index);`
			`}`
			`}`

Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00			`// Get sample value from a specific channel (or all channels)`
Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00			`for (auto s = 0; s < frame->GetAudioSamplesCount(); s++) {`
Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00			`for (auto channel_index = 0; channel_index < reader->info.channels; channel_index++) {`
			`if (channel == channel_index \|\| channel == -1) {`
Some performance optimizations. to reduce # of calls to GetAudioSamples() 2022-11-01 16:48:37 -05:00			`float *samples = channels[channel_index];`
Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00			`float rms_sample_value = std::sqrt(samples[s] * samples[s]);`

			`// Accumulate sample averages`
			`chunk_squared_sum += rms_sample_value;`
			`chunk_max = std::max(chunk_max, rms_sample_value);`
			`}`
			`}`

Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00			`sample_index += 1;`

			`// Cut-off reached`
			`if (sample_index % sample_divisor == 0) {`
Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00			`float avg_squared_sum = chunk_squared_sum / (sample_divisor * channel_count);`
			`data.max_samples[extracted_index] = chunk_max;`
			`data.rms_samples[extracted_index] = avg_squared_sum;`
Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00			`extracted_index++;`

			`// Track max/min values`
Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00			`samples_max = std::max(samples_max, chunk_max);`
Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00
			`// reset sample total and index`
			`sample_index = 0;`
Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00			`chunk_max = 0.0;`
			`chunk_squared_sum = 0.0;`
Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00			`}`
			`}`
			`}`

			`// Scale all values to the -1 to +1 range (regardless of how small or how large the`
			`// original audio sample values are)`
			`if (normalize) {`
Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00			`float scale = 1.0f / samples_max;`
			`data.scale(total_samples, scale);`
Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00			`}`

			`// Resume previous has_video value`
			`reader->info.has_video = does_reader_have_video;`
			`}`

Improvements to AudioWaveformer to use RMS (Root Mean Square), and return both average RMS and max RMS for graphing, including some new unit tests. 2022-11-01 15:17:03 -05:00
			`return data;`
Initial commit of AudioWaveformer class, which is designed to iterate any ReaderBase, and return a reduced "average" sample set - more useful for generating waveforms - for example, reduce a 44100 samples per second down to 20 samples per second. 2022-10-30 22:04:19 -05:00			`}`