/* libxtract feature extraction library * * Copyright (C) 2006 Jamie Bullock * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, * USA. */ /** \file xtract_scalar.h: declares functions that extract a feature as a single value from an input vector */ #ifndef XTRACT_SCALAR_H #define XTRACT_SCALAR_H #ifdef __cplusplus extern "C" { #endif /** * \defgroup scalar scalar extraction functions * * Functions that extract a feature as a single value from an input vector * * @{ */ void test(void); /** \brief Extract the mean of an input vector * * \param *data: a pointer to the first element * \param N: the number of array elements to be considered * \param *argv: a pointer to NULL * \param *result: the mean of N values from the array pointed to by *data */ int xtract_mean(const float *data, const int N, const void *argv, float *result); /** \brief Extract the variance of an input vector * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: a pointer to a float representing the mean of the input vector * \param *result: the variance of N values from the array pointed to by *data */ int xtract_variance(const float *data, const int N, const void *argv, float *result); /** \brief Extract the deviation of an input vector * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: a pointer to a float representing the variance of the input vector * \param *result: the deviation of N values from the array pointed to by *data */ int xtract_standard_deviation(const float *data, const int N, const void *argv, float *result); /** \brief Extract the average deviation of an input vector * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: a pointer to a float representing the mean of the input vector * \param *result: the average deviation of N values from the array pointed to by *data */ int xtract_average_deviation(const float *data, const int N, const void *argv, float *result); /** \brief Extract the skewness of an input vector * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: a pointer to an array of floats representing the mean and standard deviation of the input vector * \param *result: the skewness of N values from the array pointed to by *data */ int xtract_skewness(const float *data, const int N, const void *argv, float *result); /** \brief Extract the kurtosis of an input vector * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: a pointer to an array of values representing the mean and standard deviation of the input vector * \param *result: the kurtosis of N values from the array pointed to by *data */ int xtract_kurtosis(const float *data, const int N, const void *argv, float *result); /** \brief Extract the mean of an input spectrum * * \param *data: a pointer to the first element in an array of floats representing the spectrum of an audio vector, (e.g. the array pointed to by *result from xtract_spectrum(), xtract_peak_spectrum() or xtract_harmonic_spectrum()). * \param N: the size of the array pointed to by *data * \param *argv: a pointer to NULL * \param *result: the mean of the spectrum pointed to by *data */ int xtract_spectral_mean(const float *data, const int N, const void *argv, float *result); /** \brief Extract the variance of an input spectrum * * \param *data: a pointer to the first element in an array of floats representing the spectrum of an audio vector, (e.g. the array pointed to by *result from xtract_spectrum(), xtract_peak_spectrum() or xtract_harmonic_spectrum()). * \param N: the number of elements to be considered * \param N: the size of the array pointed to by *data * \param *argv: a pointer to a float representing the spectral mean of the input spectrum * \param *result: the variance of the spectrum pointed to by *data */ int xtract_spectral_variance(const float *data, const int N, const void *argv, float *result); /** \brief Extract the deviation of an input spectrum * * \param *data: a pointer to the first element in an array of floats representing the spectrum of an audio vector, (e.g. the array pointed to by *result from xtract_spectrum(), xtract_peak_spectrum() or xtract_harmonic_spectrum()). * \param N: the size of the array pointed to by *data * \param *argv: a pointer to a float representing the spectral variance of the input spectrum * \param *result: the deviation of the spectrum pointed to by *data */ int xtract_spectral_standard_deviation(const float *data, const int N, const void *argv, float *result); /** \brief Extract the average deviation of an input spectrum * * \param *data: a pointer to the first element in an array of floats representing the spectrum of an audio vector, (e.g. the array pointed to by *result from xtract_spectrum(), xtract_peak_spectrum() or xtract_harmonic_spectrum()). * \param N: the size of the array pointed to by *data * \param *argv: a pointer to a float representing the spectral mean of the input spectrum * \param *result: the average deviation of the spectrum pointed to by *data */ int xtract_spectral_average_deviation(const float *data, const int N, const void *argv, float *result); /** \brief Extract the skewness of an input spectrum * * \param *data: a pointer to the first element in an array of floats representing the spectrum of an audio vector, (e.g. the array pointed to by *result from xtract_spectrum(), xtract_peak_spectrum() or xtract_harmonic_spectrum()). * \param N: the size of the array pointed to by *data * \param *argv: a pointer to an array of floats representing the spectral mean and spectral standard deviation of the input spectrum * \param *result: the skewness of the spectrum pointed to by *data */ int xtract_spectral_skewness(const float *data, const int N, const void *argv, float *result); /** \brief Extract the kurtosis of an input spectrum * * \param *data: a pointer to the first element in an array of floats representing the spectrum of an audio vector, (e.g. the array pointed to by *result from xtract_spectrum(), xtract_peak_spectrum() or xtract_harmonic_spectrum()). * \param N: the size of the array pointed to by *data * \param *argv: a pointer to an array of values representing the spectral mean and spectral standard deviation of the input spectrum * \param *result: the kurtosis of the spectrum pointed to by *data */ int xtract_spectral_kurtosis(const float *data, const int N, const void *argv, float *result); /** \brief Extract the centroid of an input vector * * \param *data: a pointer to the first element in an array of floats representing the spectrum of an audio vector, (e.g. the array pointed to by *result from xtract_spectrum(), xtract_peak_spectrum() or xtract_harmonic_spectrum()). * \param N: the number of elements to be considered * \param *argv: a pointer to NULL * \param *result: the centroid of the values pointed to by *data * * Note: for a more 'accurate' result *result from xtract_peak_spectrum() can be passed in. This gives the interpolated peak frequency locations. * */ int xtract_spectral_centroid(const float *data, const int N, const void *argv, float *result); /** \brief Calculate the Irregularity of an input vector using a method described by Krimphoff (1994) * * \param *data: a pointer to the first element in an array of floats representing the magnitude coefficients from the spectrum of an audio vector, (e.g. the first half of the array pointed to by *result from xtract_spectrum(). * \param N: the number of elements to be considered * \param *argv: a pointer to NULL * \param *result: the irregularity of N values from the array pointed to by *data */ int xtract_irregularity_k(const float *data, const int N, const void *argv, float *result); /** \brief Calculate the Irregularity of an input vector using a method described by Jensen (1999) * * \param *data: a pointer to the first element in an array of floats representing the magnitude coefficients from the spectrum of an audio vector, (e.g. the first half of the array pointed to by *result from xtract_spectrum(). * \param N: the number of elements to be considered * \param *argv: a pointer to NULL * \param *result: the irregularity of N values from the array pointed to by *data */ int xtract_irregularity_j(const float *data, const int N, const void *argv, float *result); /** \brief Calculate the Tristimulus of an input vector using a method described by Pollard and Jansson (1982) * * \param *data: a pointer to the first element in an array of floats representing the magnitude coefficients of the harmonic spectrum of an audio vector e.g. a pointer to the first half of the array pointed to by *result from xtract_harmonics(). The amplitudes of the peak spectrum (e.g. *result from xtract_peak_spectrum()) can be used if one wishes to consider all partials not just harmonics. * \param N: the number of elements to be considered * \param *argv: a pointer to NULL * \param *result: the tristimulus of N values from the array pointed to by *data * * These three functions provide the first, second and third order tristimulus formulae * */ int xtract_tristimulus_1(const float *data, const int N, const void *argv, float *result); int xtract_tristimulus_2(const float *data, const int N, const void *argv, float *result); int xtract_tristimulus_3(const float *data, const int N, const void *argv, float *result); /** \brief Extract the smoothness of an input vector using a method described by McAdams (1999) * * \param *data: a pointer to the first element in an array of floats representing the magnitude coefficients from the spectrum of an audio vector, (e.g. the first half of the array pointed to by *result from xtract_spectrum(). * \param N: the number of elements to be considered * \param *argv: a pointer to the first element of an array of integers containing the lower bound, upper bound, and pre-scaling factor, whereby array data in the range lower < n < upper will be pre-scaled by p before processing. * \param *result: the smoothness of N values from the array pointed to by *data */ int xtract_smoothness(const float *data, const int N, const void *argv, float *result); /** \brief Extract the spectral spread of an input vector using a method described by Casagrande(2005) * * \param *data: a pointer to the first element in an array of floats representing the magnitude coefficients from the spectrum of an audio vector, (e.g. the first half of the array pointed to by *result from xtract_spectrum(). * \param N: the number of elements to be considered * \param *argv: a pointer to a float corresponding to the spectral centroid * \param *result: the spectral spread of N values from the array pointed to by *data */ int xtract_spread(const float *data, const int N, const void *argv, float *result); /* Zero crossing rate */ /** \brief Extract the zero crossing rate of an input vector * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: a pointer to NULL * \param *result: the zero crossing rate of N values from the array pointed to by *data */ int xtract_zcr(const float *data, const int N, const void *argv, float *result); /** \brief Extract the spectral rolloff of an input vector using a method described by Bee Suan Ong (2005) * * \param *data: a pointer to the first element in an array of floats representing the magnitude coefficients from the spectrum of an audio vector, (e.g. the first half of the array pointed to by *result from xtract_spectrum(). * \param N: the number of elements to be considered * \param *argv: a pointer to an array containing a float representing (samplerate / N ) and a float representing the threshold for rolloff, i.e. the percentile at which the rolloff is determined, expressed as a percentage, and * \param *result: the spectral rolloff in Hz of N values from the array pointed to by *data. This is the point in the spectrum below which argv[0] of the energy is distributed. */ int xtract_rolloff(const float *data, const int N, const void *argv, float *result); /** \brief Extract the 'total loudness' of an input vector using a method described by Moore, Glasberg et al (2005) * * \param *data: a pointer to the first element in an array of floats representing a set of BARK_BANDS bark coefficients * \param N: the number of coefficients to be considered * \param *argv: a pointer to NULL * \param *result: the total loudness of N values from the array pointed to by *data * * Note: if N = 1, the 'specific loudness' of the bark band pointed to by *data will be given by *result * */ int xtract_loudness(const float *data, const int N, const void *argv, float *result); /** \brief Extract the spectral flatness measure of an input vector, where the flatness measure (SFM) is defined as the ratio of the geometric mean to the arithmetic mean of a magnitude spectrum. * * \note The computation method used here is the most efficient by a significant margin, but suffers from precision problems due to the multiplication operationin the geometric mean calculation. This is particularly accute for larger values of N (>=256). However, as noted by Peeters (2003), the SFM should generally be computed on a small number of 'bands' rather than on the complete magnitude spectrum. It is therefore highly recommended that xtract_bands() is used prior to calling xtract_flatness(). * * \param *data: a pointer to the first element in an array of floats representing the magnitude coefficients from the spectrum of an audio vector, (e.g. the first half of the array pointed to by *result from xtract_spectrum(). Alternatively the magnitudes from a number of 'subbands' can be used by using *result from xtract_bands(). * \param N: the number of *data array elements to be considered * \param *argv: a pointer to NULL * \param *result: the flatness of N values from the array pointed to by *data */ int xtract_flatness(const float *data, const int N, const void *argv, float *result); /** \brief Extract the LOG spectral flatness measure of an input vector * * \param *data: a pointer to NULL. * \param N: not used - can safely be set to 0. * \param *argv: a pointer to a float represnting spectral flatness. * \param *result: the LOG spectral flatness of N values from the array pointed to by *data * * flatness_db = 10 * log10(flatness) * */ int xtract_flatness_db(const float *data, const int N, const void *argv, float *result); /** \brief Extract the tonality factor of an input vector using a method described by Peeters 2003 * * \param *data: a pointer to NULL. * \param N: not used - can safely be set to 0. * \param *argv: a pointer to the LOG spectral flatness measure of an audio vector (e.g. the output from xtract_flatness_db) * \param *result: the tonality factor of N values from the array pointed to by *data */ int xtract_tonality(const float *data, const int N, const void *argv, float *result); /** \brief Extract the noisiness of an input vector using a method described by Tae Hong Park (2000) * * \param *data: a pointer to NULL * \param N: * \param *argv: a pointer to an array containing a float represnting the number of harmonic partials in a spectrum, and a float representing the number of partials in a spectrum * \param *result: the noisiness coefficient as calculated from argv */ int xtract_noisiness(const float *data, const int N, const void *argv, float *result); /** \brief Extract the RMS amplitude of an input vector using a method described by Tae Hong Park (2000) * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: a pointer to NULL * \param *result: the RMS amplitude of N values from the array pointed to by *data */ int xtract_rms_amplitude(const float *data, const int N, const void *argv, float *result); /** \brief Extract the Inharmonicity of an input vector * * \param *data: a pointer to the first element in an array of floats represeting a magnitude peak spectrum of size N/2, and a frequency spectrum of size N/2 (This is the output format of xtract_peak_spectrum()) * \param N: the number of elements to be considered * \param *argv: a pointer to a float representing the fundamental frequency of the input vector. * \param *result: the inharmonicity of N values from the array pointed to by *data */ int xtract_spectral_inharmonicity(const float *data, const int N, const void *argv, float *result); /** \brief Extract the spectral crest of an input vector using a method described by Peeters (2003) * * \param *data: a pointer to NULL * \param N: not used * \param *argv: a pointer to an array containing a float representing the maximum value in a spectrum, and a float representing the mean value of a spectrum * \param *result: the spectral crest of N values from the array pointed to by *data */ int xtract_crest(const float *data, const int N, const void *argv, float *result); /** \brief Extract the Spectral Power of an input vector using a method described by Bee Suan Ong (2005) * * \param *data: a pointer to the first element in an array of floats representing the magnitude coefficients from the spectrum of an audio vector, (e.g. the first half of the array pointed to by *result from xtract_spectrum(). * \param N: the number of elements to be considered * \param *argv: a pointer to NULL * \param *result: the spectral power of N values from the array pointed to by *data */ int xtract_power(const float *data, const int N, const void *argv, float *result); /* Odd to even harmonic ratio */ /** \brief Extract the Odd to even harmonic ratio of an input vector * * \param *data: a pointer to the first element in an array of floats representing the amplitudes of the harmonic spectrum of an audio vector. It is sufficient to pass in a pointer to the first half of the array pointed to by *result from xtract_harmonic_spectrum(). * \param N: the number of elements to be considered. If using the array pointed to by *result from xtract_harmonics, N should equal half the total array size i.e., just the amplitudes of the peaks. * \param *argv: a pointer to NULL * \param *result: the even/odd harmonic ratio of N values from the array pointed to by *data */ int xtract_odd_even_ratio(const float *data, const int N, const void *argv, float *result); /** \brief Extract the Sharpness of an input vector * * \param *data: a pointer to the first element in an array of floats representing the magnitude coefficients from the spectrum of an audio vector, (e.g. the first half of the array pointed to by *result from xtract_spectrum(). * \param N: the number of elements to be considered * \param *argv: a pointer to NULL * \param *result: the Sharpness of N values from the array pointed to by *data */ int xtract_sharpness(const float *data, const int N, const void *argv, float *result); /** \brief Extract the Slope of an input vector using a method described by Peeters(2003) * * \param *data: a pointer to the first element in an array of floats representing the spectrum of an audio vector, (e.g. the array pointed to by *result from xtract_spectrum(), xtract_peak_spectrum() or xtract_harmonic_spectrum()). * \param N: the number of elements to be considered * \param *argv: a pointer to NULL * \param *result: the Slope of N values from the array pointed to by *data */ int xtract_spectral_slope(const float *data, const int N, const void *argv, float *result); /** \brief Extract the value of the lowest value in an input vector * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: a pointer to a float representing the lower limit for the search. i.e. (*result > *argv) returns 1. * \param *result: a pointer to a value representing the lowest component in *data that falls above a given threshold. * */ int xtract_lowest_value(const float *data, const int N, const void *argv, float *result); /** \brief Extract the value of the highest value in an input vector * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: a pointer to NULL. * \param *result: a pointer to a value representing the highest component in *data. * */ int xtract_highest_value(const float *data, const int N, const void *argv, float *result); /** \brief Extract the sum of the values in an input vector * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: a pointer to NULL. * \param *result: a pointer to a value representing the sum of all of the values pointed to by *data. * */ int xtract_sum(const float *data, const int N, const void *argv, float *result); /** \brief Extract the Pitch of an input vector using Harmonic Product Spectrum (HPS) analysis * * \warning {This function doesn't work properly} * * \param *data: a pointer to the first element in an array of floats representing the magnitude coefficients from the spectrum of an audio vector, (e.g. the first half of the array pointed to by *result from xtract_spectrum(). * \param N: the number of elements to be considered * \param *argv: a pointer to NULL * \param *result: the pitch of N values from the array pointed to by *data */ int xtract_hps(const float *data, const int N, const void *argv, float *result); /** \brief Extract the fundamental frequency of an input vector * * \param *data: a pointer to the first element in an array of floats representing an audio vector * \param N: the number of elements to be considered * \param *argv: a pointer to a float representing the audio sample rate * \param *result: the pitch of N values from the array pointed to by *data * * This algorithm is based on the AMDF, with peak and centre clipping. It would benefit from further improvements to improve noise robustness and overall efficiency * * It is based on suggestion by Robert Bristow-Johnson in a discussion on the comp.dsp mailing list, subject "Reference implementation of pitch detection" * */ int xtract_f0(const float *data, const int N, const void *argv, float *result); /** \brief Extract the fundamental frequency of an input vector * * \param *data: a pointer to the first element in an array of floats representing an audio vector * \param N: the number of elements to be considered * \param *argv: a pointer to a float representing the audio sample rate * \param *result: the pitch of N values from the array pointed to by *data * * This function wraps xtract_f0, but provides the frequency of the lowest partial in the peak spectrum if f0 can't be found. * */ int xtract_failsafe_f0(const float *data, const int N, const void *argv, float *result); /** \brief Extract the number of non-zero elements in an input vector * * \param *data: a pointer to the first element in an array of floats * \param N: the number of elements to be considered * \param *argv: not used * \param *result: the number of non-zero elements in the array pointed to by *data * */ int xtract_nonzero_count(const float *data, const int N, const void *argv, float *result); /** @} */ #ifdef __cplusplus } #endif #endif