2022-05-23 15:04:34 +01:00
/* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
/*
Rubber Band Library
An audio time - stretching and pitch - shifting library .
Copyright 2007 - 2022 Particular Programs Ltd .
This program is free software ; you can redistribute it and / or
modify it under the terms of the GNU General Public License as
published by the Free Software Foundation ; either version 2 of the
License , or ( at your option ) any later version . See the file
COPYING included with this distribution for more information .
Alternatively , if you have a valid commercial licence for the
Rubber Band Library obtained by agreement with the copyright
holders , you may redistribute and / or modify it under the terms
described in that licence .
If you wish to distribute code using the Rubber Band Library
under terms other than those of the GNU General Public License ,
you must obtain a valid commercial licence before doing so .
*/
# include "R3StretcherImpl.h"
# include <array>
namespace RubberBand {
void
R3StretcherImpl : : setTimeRatio ( double ratio )
{
m_timeRatio = ratio ;
2022-05-23 17:59:40 +01:00
calculateHop ( ) ;
2022-05-23 15:04:34 +01:00
}
void
R3StretcherImpl : : setPitchScale ( double scale )
{
m_pitchScale = scale ;
2022-05-23 17:59:40 +01:00
calculateHop ( ) ;
}
void
R3StretcherImpl : : calculateHop ( )
{
double ratio = getEffectiveRatio ( ) ;
double proposedOuthop = 256 ;
if ( ratio > 1.0 ) {
double inhop = proposedOuthop / ratio ;
if ( inhop < 1.0 ) {
m_parameters . logger ( " WARNING: Extreme ratio yields ideal inhop < 1, results may be suspect " ) ;
m_inhop = 1 ;
} else {
m_inhop = int ( round ( inhop ) ) ;
}
} else {
double inhop = std : : min ( proposedOuthop / ratio , 340.0 ) ;
m_inhop = int ( round ( inhop ) ) ;
}
std : : ostringstream str ;
str < < " R3StretcherImpl::calculateHop: for effective ratio " < < ratio
< < " calculated (typical) inhop of " < < m_inhop < < std : : endl ;
m_parameters . logger ( str . str ( ) ) ;
2022-05-23 15:04:34 +01:00
}
double
R3StretcherImpl : : getTimeRatio ( ) const
{
return m_timeRatio ;
}
double
R3StretcherImpl : : getPitchScale ( ) const
{
return m_pitchScale ;
}
size_t
R3StretcherImpl : : getLatency ( ) const
{
return 0 ; //!!!
}
size_t
R3StretcherImpl : : getChannelCount ( ) const
{
return m_parameters . channels ;
}
void
R3StretcherImpl : : reset ( )
{
//!!!
}
size_t
R3StretcherImpl : : getSamplesRequired ( ) const
{
int longest = m_guideConfiguration . longestFftSize ;
size_t rs = m_channelData [ 0 ] - > inbuf - > getReadSpace ( ) ;
if ( rs < longest ) {
return longest - rs ;
} else {
return 0 ;
}
}
void
R3StretcherImpl : : process ( const float * const * input , size_t samples , bool final )
{
//!!! todo: final
2022-05-23 16:45:41 +01:00
2022-05-23 20:55:56 +01:00
//!!! m_parameters.logger("process called");
2022-05-23 16:45:41 +01:00
if ( final ) {
2022-05-23 20:55:56 +01:00
// m_parameters.logger("final = true");
2022-05-23 16:45:41 +01:00
m_draining = true ;
}
2022-05-23 15:04:34 +01:00
bool allConsumed = false ;
size_t ws = m_channelData [ 0 ] - > inbuf - > getWriteSpace ( ) ;
if ( samples > ws ) {
//!!! check this
m_parameters . logger ( " R3StretcherImpl::process: WARNING: Forced to increase input buffer size. Either setMaxProcessSize was not properly called or process is being called repeatedly without retrieve. " ) ;
size_t newSize = m_channelData [ 0 ] - > inbuf - > getSize ( ) - ws + samples ;
for ( int c = 0 ; c < m_parameters . channels ; + + c ) {
m_channelData [ c ] - > inbuf =
std : : unique_ptr < RingBuffer < float > >
( m_channelData [ c ] - > inbuf - > resized ( newSize ) ) ;
}
}
for ( int c = 0 ; c < m_parameters . channels ; + + c ) {
m_channelData [ c ] - > inbuf - > write ( input [ c ] , samples ) ;
}
consume ( ) ;
}
int
R3StretcherImpl : : available ( ) const
{
2022-05-23 20:55:56 +01:00
//!!! m_parameters.logger("available called");
2022-05-23 16:45:41 +01:00
int av = int ( m_channelData [ 0 ] - > outbuf - > getReadSpace ( ) ) ;
if ( av = = 0 & & m_draining ) return - 1 ;
else return av ;
2022-05-23 15:04:34 +01:00
}
size_t
R3StretcherImpl : : retrieve ( float * const * output , size_t samples ) const
{
2022-05-23 20:55:56 +01:00
//!!! m_parameters.logger("retrieve called");
2022-05-23 15:04:34 +01:00
size_t got = samples ;
for ( size_t c = 0 ; c < m_parameters . channels ; + + c ) {
size_t gotHere = m_channelData [ c ] - > outbuf - > read ( output [ c ] , got ) ;
if ( gotHere < got ) {
if ( c > 0 ) {
m_parameters . logger ( " R3StretcherImpl::retrieve: WARNING: channel imbalance detected " ) ;
}
got = gotHere ;
}
}
return got ;
}
void
R3StretcherImpl : : consume ( )
{
2022-05-23 17:59:40 +01:00
double ratio = getEffectiveRatio ( ) ;
2022-05-23 15:04:34 +01:00
int longest = m_guideConfiguration . longestFftSize ;
int classify = m_guideConfiguration . classificationFftSize ;
2022-05-23 17:59:40 +01:00
2022-05-24 12:00:54 +01:00
m_calculator - > setDebugLevel ( 3 ) ;
2022-05-23 17:59:40 +01:00
int outhop = m_calculator - > calculateSingle ( ratio ,
1.0 / m_pitchScale ,
1.f ,
m_inhop ,
longest ,
longest ) ;
2022-05-24 12:00:54 +01:00
std : : cout < < " outhop = " < < outhop < < std : : endl ;
2022-05-23 17:59:40 +01:00
double instantaneousRatio = double ( outhop ) / double ( m_inhop ) ;
2022-05-23 15:04:34 +01:00
2022-05-23 20:55:56 +01:00
while ( m_channelData . at ( 0 ) - > outbuf - > getWriteSpace ( ) > = outhop ) {
//!!! m_parameters.logger("consume looping");
2022-05-23 17:59:40 +01:00
2022-05-23 20:55:56 +01:00
int readSpace = m_channelData . at ( 0 ) - > inbuf - > getReadSpace ( ) ;
if ( readSpace < longest ) {
if ( m_draining ) {
if ( readSpace = = 0 ) {
break ;
}
} else {
break ;
}
2022-05-23 17:59:40 +01:00
}
2022-05-23 20:55:56 +01:00
2022-05-23 15:04:34 +01:00
for ( int c = 0 ; c < m_parameters . channels ; + + c ) {
2022-05-23 17:36:26 +01:00
auto cd = m_channelData . at ( c ) ;
2022-05-23 15:04:34 +01:00
auto longestScale = cd - > scales . at ( longest ) ;
2022-05-23 20:55:56 +01:00
auto buf = longestScale - > timeDomainFrame . data ( ) ;
if ( readSpace < longest ) {
v_zero ( buf , longest ) ;
cd - > inbuf - > peek ( buf , readSpace ) ;
} else {
cd - > inbuf - > peek ( buf , longest ) ;
}
2022-05-23 15:04:34 +01:00
for ( auto it : cd - > scales ) {
int fftSize = it . first ;
auto scale = it . second ;
if ( fftSize = = longest ) continue ;
int offset = ( longest - fftSize ) / 2 ;
m_scaleData . at ( fftSize ) - > analysisWindow . cut
2022-05-23 20:55:56 +01:00
( buf + offset , scale - > timeDomainFrame . data ( ) ) ;
2022-05-23 15:04:34 +01:00
}
2022-05-23 20:55:56 +01:00
m_scaleData . at ( longest ) - > analysisWindow . cut ( buf ) ;
2022-05-23 15:04:34 +01:00
for ( auto it : cd - > scales ) {
int fftSize = it . first ;
auto scale = it . second ;
m_scaleData . at ( fftSize ) - > fft . forwardPolar
( scale - > timeDomainFrame . data ( ) ,
scale - > mag . data ( ) ,
scale - > phase . data ( ) ) ;
2022-05-23 17:36:26 +01:00
v_scale ( scale - > mag . data ( ) , 1.f / float ( fftSize ) ,
scale - > mag . size ( ) ) ;
2022-05-23 15:04:34 +01:00
}
auto classifyScale = cd - > scales . at ( classify ) ;
cd - > prevSegmentation = cd - > segmentation ;
2022-05-23 20:55:56 +01:00
cd - > segmentation =
cd - > segmenter - > segment ( classifyScale - > mag . data ( ) ) ;
2022-05-23 15:04:34 +01:00
m_troughPicker . findNearestAndNextPeaks
( classifyScale - > mag . data ( ) , 3 , nullptr ,
classifyScale - > nextTroughs . data ( ) ) ;
2022-05-23 17:59:40 +01:00
m_guide . calculate ( instantaneousRatio ,
classifyScale - > mag . data ( ) ,
2022-05-23 15:04:34 +01:00
classifyScale - > nextTroughs . data ( ) ,
classifyScale - > prevMag . data ( ) ,
cd - > segmentation ,
cd - > prevSegmentation ,
BinSegmenter : : Segmentation ( ) , //!!!
cd - > guidance ) ;
}
for ( auto it : m_channelData [ 0 ] - > scales ) {
int fftSize = it . first ;
for ( int c = 0 ; c < m_parameters . channels ; + + c ) {
2022-05-23 17:36:26 +01:00
auto cd = m_channelData . at ( c ) ;
2022-05-23 15:04:34 +01:00
auto classifyScale = cd - > scales . at ( fftSize ) ;
m_channelAssembly . mag [ c ] = classifyScale - > mag . data ( ) ;
m_channelAssembly . phase [ c ] = classifyScale - > phase . data ( ) ;
m_channelAssembly . guidance [ c ] = & cd - > guidance ;
m_channelAssembly . outPhase [ c ] = classifyScale - > outPhase . data ( ) ;
}
m_scaleData . at ( fftSize ) - > guided . advance
( m_channelAssembly . outPhase . data ( ) ,
m_channelAssembly . mag . data ( ) ,
m_channelAssembly . phase . data ( ) ,
m_guideConfiguration ,
m_channelAssembly . guidance . data ( ) ,
2022-05-23 17:59:40 +01:00
m_inhop ,
2022-05-23 15:04:34 +01:00
outhop ) ;
}
for ( int c = 0 ; c < m_parameters . channels ; + + c ) {
2022-05-23 17:36:26 +01:00
auto cd = m_channelData . at ( c ) ;
for ( auto it : cd - > scales ) {
2022-05-23 15:04:34 +01:00
auto scale = it . second ;
int bufSize = scale - > bufSize ;
// copy to prevMag before filtering
v_copy ( scale - > prevMag . data ( ) , scale - > mag . data ( ) , bufSize ) ;
v_copy ( scale - > prevOutPhase . data ( ) , scale - > outPhase . data ( ) , bufSize ) ;
2022-05-23 16:45:41 +01:00
//!!! seems wasteful
2022-05-23 15:04:34 +01:00
for ( int i = 0 ; i < bufSize ; + + i ) {
scale - > phase [ i ] = princarg ( scale - > outPhase [ i ] ) ;
}
}
2022-05-23 17:36:26 +01:00
for ( const auto & band : cd - > guidance . fftBands ) {
int fftSize = band . fftSize ;
auto scale = cd - > scales . at ( fftSize ) ;
auto scaleData = m_scaleData . at ( fftSize ) ;
//!!! messy and v slow, but leave it until we've
//!!! discovered whether we need a window accumulator
//!!! (we probably do)
int analysisWindowSize = scaleData - > analysisWindow . getSize ( ) ;
int synthesisWindowSize = scaleData - > synthesisWindow . getSize ( ) ;
int offset = ( analysisWindowSize - synthesisWindowSize ) / 2 ;
float winscale = 0.f ;
for ( int i = 0 ; i < synthesisWindowSize ; + + i ) {
winscale + = scaleData - > analysisWindow . getValue ( i + offset ) *
scaleData - > synthesisWindow . getValue ( i ) ;
}
winscale = float ( outhop ) / winscale ;
2022-05-24 12:00:54 +01:00
double factor = m_parameters . sampleRate / double ( fftSize ) ;
2022-05-23 17:36:26 +01:00
for ( int i = 0 ; i < fftSize / 2 + 1 ; + + i ) {
double f = double ( i ) * factor ;
if ( f > = band . f0 & & f < band . f1 ) {
2022-05-24 12:00:54 +01:00
//!!! check the mod 2 bit from stretch-fn
2022-05-23 17:36:26 +01:00
scale - > mag [ i ] * = winscale ;
} else {
scale - > mag [ i ] = 0.f ;
}
}
}
for ( auto it : cd - > scales ) {
2022-05-23 15:04:34 +01:00
int fftSize = it . first ;
auto scale = it . second ;
auto scaleData = m_scaleData . at ( fftSize ) ;
2022-05-24 12:00:54 +01:00
2022-05-23 15:04:34 +01:00
scaleData - > fft . inversePolar ( scale - > mag . data ( ) ,
scale - > phase . data ( ) ,
scale - > timeDomainFrame . data ( ) ) ;
2022-05-23 17:36:26 +01:00
2022-05-23 16:45:41 +01:00
int synthesisWindowSize = scaleData - > synthesisWindow . getSize ( ) ;
2022-05-24 12:00:54 +01:00
int fromOffset = ( fftSize - synthesisWindowSize ) / 2 ;
int toOffset = ( m_guideConfiguration . longestFftSize -
synthesisWindowSize ) / 2 ;
2022-05-23 16:45:41 +01:00
scaleData - > synthesisWindow . cutAndAdd
2022-05-24 12:00:54 +01:00
( scale - > timeDomainFrame . data ( ) + fromOffset ,
scale - > accumulator . data ( ) + toOffset ) ;
2022-05-23 15:04:34 +01:00
}
2022-05-24 12:00:54 +01:00
auto mixptr = cd - > mixdown . data ( ) ;
v_zero ( mixptr , outhop ) ;
2022-05-23 15:04:34 +01:00
for ( auto it : cd - > scales ) {
auto scale = it . second ;
2022-05-24 12:00:54 +01:00
v_add ( mixptr , scale - > accumulator . data ( ) , outhop ) ;
2022-05-23 15:04:34 +01:00
}
2022-05-23 20:55:56 +01:00
2022-05-24 12:00:54 +01:00
cd - > outbuf - > write ( mixptr , outhop ) ;
for ( auto it : cd - > scales ) {
int fftSize = it . first ;
auto scale = it . second ;
auto accptr = scale - > accumulator . data ( ) ;
int n = scale - > accumulator . size ( ) - outhop ;
v_move ( accptr , accptr + outhop , n ) ;
v_zero ( accptr + n , outhop ) ;
}
2022-05-23 20:55:56 +01:00
if ( readSpace < m_inhop ) {
// This should happen only when draining
cd - > inbuf - > skip ( readSpace ) ;
} else {
cd - > inbuf - > skip ( m_inhop ) ;
}
2022-05-23 15:04:34 +01:00
}
}
}
}