Aegisub/src/audio_renderer_spectrum.h
EleonoreMizo f9c8a7f6aa Spectrum display improvement
– Selection of different frequency mappings for the spectrum display,
from linear (current default) to logarithmic.
– Field added in the preference page to select the frequency mapping
– New preference key to remember this setting:
Audio/Renderer/Spectrum/FreqCurve
– Consistent display with high sampling rates (> 48 kHz)
– Fixed time shift with high quality settings
2020-12-15 20:11:58 +01:00

172 lines
6.7 KiB
C++

// Copyright (c) 2009, Niels Martin Hansen
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// * Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
// * Neither the name of the Aegisub Group nor the names of its contributors
// may be used to endorse or promote products derived from this software
// without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.
//
// Aegisub Project http://www.aegisub.org/
/// @file audio_renderer_spectrum.h
/// @see audio_renderer_spectrum.cpp
/// @ingroup audio_ui
///
/// Calculate and render a frequency-power spectrum for PCM audio data.
#include <cstddef>
#include <cstdint>
#include <memory>
#include <string>
#include <vector>
#include "audio_renderer.h"
#ifdef WITH_FFTW3
#include <fftw3.h>
#endif
class AudioColorScheme;
class AudioSpectrumCache;
struct AudioSpectrumCacheBlockFactory;
/// @class AudioSpectrumRenderer
/// @brief Render frequency-power spectrum graphs for audio data.
///
/// Renders frequency-power spectrum graphs of PCM audio data using a derivation function
/// such as the fast fourier transform.
///
/// Instances are not copyable: the cache is held through a std::unique_ptr and,
/// when built with FFTW3, the object holds raw FFTW handles. The copy operations
/// are therefore explicitly deleted rather than left implicitly deleted.
class AudioSpectrumRenderer final : public AudioRendererBitmapProvider {
	friend struct AudioSpectrumCacheBlockFactory;

	/// Internal cache management for the spectrum
	std::unique_ptr<AudioSpectrumCache> cache;

	/// Colour tables used for rendering
	std::vector<AudioColorScheme> colors;

	/// User-provided value for derivation_size
	size_t derivation_size_user = 0;

	/// User-provided value for derivation_dist
	size_t derivation_dist_user = 0;

	/// Maximum audible, displayed frequency, in Hz. Avoids wasting the display
	/// space with ultrasonic content at sampling rates > 40 kHz.
	float max_freq = 20000.f;

	/// Relative vertical position of the reference frequency (freq_ref, 1 kHz),
	/// in the (0 ; 1) open range.
	/// 0 = bottom of the display zone, 1 = top
	/// The actual position, as displayed, is limited by the available mapping
	/// curves (linear and log).
	/// Values close to 0 will give a linear curve, and close to 1 a log curve.
	float pos_fref = 1.0f / 3;

	/// Reference frequency whose vertical position is constant, Hz.
	const float freq_ref = 1000.0f;

	/// Binary logarithm of number of samples to use in deriving frequency-power data
	/// This could differ from the user-provided value because the actual value
	/// used in computations may be scaled, depending on the sampling rate.
	size_t derivation_size = 0;

	/// Binary logarithm of number of samples between the start of derivations
	/// This could differ from the user-provided value because the actual value
	/// used in computations may be scaled, depending on the sampling rate.
	size_t derivation_dist = 0;

	/// @brief Reset in response to changing audio provider
	///
	/// Overrides the OnSetProvider event handler in the base class, to reset things
	/// when the audio provider is changed.
	void OnSetProvider() override;

	/// @brief Recreates the cache
	///
	/// To be called when the number of blocks in cache might have changed,
	/// e.g. new audio provider or new resolution.
	void RecreateCache();

	/// @brief Fill a block with frequency-power data for a time range
	/// @param block_index Index of the block to fill data for
	/// @param[out] block Address to write the data to
	void FillBlock(size_t block_index, float *block);

	/// @brief Convert audio data to float range [-1;+1)
	/// @tparam T Element type of the destination buffer
	/// @param count Samples to convert
	/// @param[out] dest Buffer to fill
	template<class T>
	void ConvertToFloat(size_t count, T *dest);

	/// @brief Updates the derivation_* after a derivation_*_user change.
	void update_derivation_values ();

#ifdef WITH_FFTW3
	/// FFTW plan data
	fftw_plan dft_plan = nullptr;

	/// Pre-allocated input array for FFTW
	double *dft_input = nullptr;

	/// Pre-allocated output array for FFTW
	fftw_complex *dft_output = nullptr;
#else
	/// Pre-allocated scratch area for doing FFT derivations
	std::vector<float> fft_scratch;
#endif

	/// Pre-allocated scratch area for storing raw audio data
	std::vector<int16_t> audio_scratch;

public:
	/// @brief Constructor
	/// @param color_scheme_name Name of the color scheme to use
	///
	/// Marked explicit so that a string is never silently converted into a
	/// renderer object.
	explicit AudioSpectrumRenderer(std::string const& color_scheme_name);

	/// Not copyable (see the class description).
	AudioSpectrumRenderer(AudioSpectrumRenderer const&) = delete;

	/// Not copy-assignable (see the class description).
	AudioSpectrumRenderer& operator=(AudioSpectrumRenderer const&) = delete;

	/// @brief Destructor
	// NOTE(review): presumably releases the FFTW plan and buffers when built
	// with WITH_FFTW3 -- confirm against audio_renderer_spectrum.cpp.
	~AudioSpectrumRenderer();

	/// @brief Render a range of audio spectrum
	/// @param bmp [in,out] Bitmap to render into, also carries length information
	/// @param start First column of pixel data in display to render
	/// @param style Style to render audio in
	void Render(wxBitmap &bmp, int start, AudioRenderingStyle style) override;

	/// @brief Render blank area
	/// @param dc Device context to draw on
	/// @param rect Area to fill
	/// @param style Style to render the blank area in
	void RenderBlank(wxDC &dc, const wxRect &rect, AudioRenderingStyle style) override;

	/// @brief Set the derivation resolution
	/// @param derivation_size Binary logarithm of number of samples to use in deriving frequency-power data
	/// @param derivation_dist Binary logarithm of number of samples between the start of derivations
	///
	/// The derivations done will each use 2^derivation_size audio samples and at a distance
	/// of 2^derivation_dist samples.
	///
	/// The derivation distance must be smaller than or equal to the size. If the distance
	/// is specified too large, it will be clamped to the size.
	void SetResolution(size_t derivation_size, size_t derivation_dist);

	/// @brief Set the vertical relative position of the reference frequency (1 kHz)
	/// @param pos_fref_ Vertical position of the 1 kHz frequency. Between 0 and 1, boundaries excluded.
	///
	/// A value close to 0 gives a linear display, and close to 1 a logarithmic display.
	void set_reference_frequency_position (float pos_fref_);

	/// @brief Cleans up the cache
	/// @param max_size Maximum size in bytes for the cache
	void AgeCache(size_t max_size) override;
};