Aegisub/aegisub/src/audio_renderer_spectrum.h

153 lines
5.6 KiB
C++

// Copyright (c) 2009, Niels Martin Hansen
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// * Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
// * Neither the name of the Aegisub Group nor the names of its contributors
// may be used to endorse or promote products derived from this software
// without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.
//
// Aegisub Project http://www.aegisub.org/
//
// $Id$
/// @file audio_renderer_spectrum.h
/// @see audio_renderer_spectrum.cpp
/// @ingroup audio_ui
///
/// Calculate and render a frequency-power spectrum for PCM audio data.
#ifndef AGI_PRE
#include <stdint.h>
#include <string>
#include <vector>
#endif
#include "audio_renderer.h"
#include <libaegisub/scoped_ptr.h>
#ifdef WITH_FFTW3
#include <fftw3.h>
#endif
// Forward declarations. Within this header these types are only named as
// scoped_ptr targets, as a pointer return type, or in a friend declaration,
// so they are declared here without pulling in their defining headers.
class AudioColorScheme;
class AudioSpectrumCache;
struct AudioSpectrumCacheBlockFactory;
/// @class AudioSpectrumRenderer
/// @brief Render frequency-power spectrum graphs for audio data.
///
/// Renders frequency-power spectrum graphs of PCM audio data using a derivation function
/// such as the fast fourier transform.
///
/// Derived frequency-power data is kept in an internal cache of blocks; the
/// block factory is a friend so that it can reach the private FillBlock().
class AudioSpectrumRenderer : public AudioRendererBitmapProvider {
	friend struct AudioSpectrumCacheBlockFactory;

	/// Internal cache management for the spectrum
	agi::scoped_ptr<AudioSpectrumCache> cache;

	/// Colour table used for regular rendering
	agi::scoped_ptr<AudioColorScheme> colors_normal;

	/// Colour table used for rendering the audio selection
	agi::scoped_ptr<AudioColorScheme> colors_selected;

	/// Colour table used for rendering inactive lines
	agi::scoped_ptr<AudioColorScheme> colors_inactive;

	/// Binary logarithm of number of samples to use in deriving frequency-power data
	size_t derivation_size;

	/// Binary logarithm of number of samples between the start of derivations
	size_t derivation_dist;

	/// @brief Reset in response to changing audio provider
	///
	/// Overrides the OnSetProvider event handler in the base class, to reset things
	/// when the audio provider is changed.
	void OnSetProvider();

	/// @brief Recreates the cache
	///
	/// To be called when the number of blocks in cache might have changed,
	/// e.g. new audio provider or new resolution.
	void RecreateCache();

	/// @brief Fill a block with frequency-power data for a time range
	/// @param      block_index Index of the block to fill data for
	/// @param[out] block       Address to write the data to
	void FillBlock(size_t block_index, float *block);

	/// @brief Convert audio data to float range [-1;+1)
	/// @tparam T Element type of the destination buffer
	/// @param count Samples to convert
	/// @param dest  Buffer to fill
	template<class T>
	void ConvertToFloat(size_t count, T *dest);

#ifdef WITH_FFTW3
	/// FFTW plan data
	fftw_plan dft_plan;

	/// Pre-allocated input array for FFTW
	double *dft_input;

	/// Pre-allocated output array for FFTW
	fftw_complex *dft_output;
#else
	/// Pre-allocated scratch area for doing FFT derivations
	std::vector<float> fft_scratch;
#endif

	/// Pre-allocated scratch area for storing raw audio data
	std::vector<int16_t> audio_scratch;

	/// @brief Get the color scheme for a rendering style
	/// @param style Rendering style to get the color scheme for
	/// @return The color scheme used for the given style
	const AudioColorScheme *GetColorScheme(AudioRenderingStyle style) const;

public:
	/// @brief Constructor
	/// @param color_scheme_name Name of the color scheme to use
	///
	/// Declared explicit so that a string is never silently converted into a
	/// renderer; a renderer must always be constructed deliberately.
	explicit AudioSpectrumRenderer(std::string const& color_scheme_name);

	/// @brief Destructor
	~AudioSpectrumRenderer();

	/// @brief Render a range of audio spectrum
	/// @param[in,out] bmp   Bitmap to render into, also carries length information
	/// @param         start First column of pixel data in display to render
	/// @param         style Style to render audio in
	void Render(wxBitmap &bmp, int start, AudioRenderingStyle style);

	/// @brief Render blank area
	/// @param dc    Device context to render into
	/// @param rect  Rectangle to render as blank
	/// @param style Style to render the blank area in
	void RenderBlank(wxDC &dc, const wxRect &rect, AudioRenderingStyle style);

	/// @brief Set the derivation resolution
	/// @param derivation_size Binary logarithm of number of samples to use in deriving frequency-power data
	/// @param derivation_dist Binary logarithm of number of samples between the start of derivations
	///
	/// The derivations done will each use 2^derivation_size audio samples and at a distance
	/// of 2^derivation_dist samples.
	///
	/// The derivation distance must be smaller than or equal to the size. If the distance
	/// is specified too large, it will be clamped to the size.
	void SetResolution(size_t derivation_size, size_t derivation_dist);

	/// @brief Cleans up the cache
	/// @param max_size Maximum size in bytes for the cache
	void AgeCache(size_t max_size);
};