// Source file: librubberband/src/finer/R3StretcherImpl.cpp
/* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
/*
Rubber Band Library
An audio time-stretching and pitch-shifting library.
Copyright 2007-2022 Particular Programs Ltd.
This program is free software; you can redistribute it and/or
modify it under the terms of the GNU General Public License as
published by the Free Software Foundation; either version 2 of the
License, or (at your option) any later version. See the file
COPYING included with this distribution for more information.
Alternatively, if you have a valid commercial licence for the
Rubber Band Library obtained by agreement with the copyright
holders, you may redistribute and/or modify it under the terms
described in that licence.
If you wish to distribute code using the Rubber Band Library
under terms other than those of the GNU General Public License,
you must obtain a valid commercial licence before doing so.
*/
#include "R3StretcherImpl.h"
#include <array>
namespace RubberBand {
void
R3StretcherImpl::setTimeRatio(double ratio)
{
m_timeRatio = ratio;
2022-05-23 17:59:40 +01:00
calculateHop();
2022-05-23 15:04:34 +01:00
}
void
R3StretcherImpl::setPitchScale(double scale)
{
m_pitchScale = scale;
2022-05-23 17:59:40 +01:00
calculateHop();
}
// Recalculate m_inhop, the typical input hop, from the effective
// ratio returned by getEffectiveRatio().
//
// The hop is chosen so that inhop * ratio is close to a nominal
// output hop of 256:
//  - for ratio > 1 the ideal inhop is below 256; it is rounded to the
//    nearest integer and floored at 1 (with a warning) for extreme
//    ratios;
//  - for 0 < ratio <= 1 the ideal inhop is 256 or more; it is capped
//    at 340 before rounding;
//  - a ratio that is zero, negative or NaN has no meaningful ideal
//    inhop. Without a guard it would produce a negative hop or an
//    undefined float-to-int conversion, so a warning is logged and
//    the capped value is used instead.
//
// The outcome is reported through m_parameters.logger.
void
R3StretcherImpl::calculateHop()
{
    double ratio = getEffectiveRatio();
    double proposedOuthop = 256;
    double maxInhop = 340.0;

    if (!(ratio > 0.0)) {
        // Written as a negated comparison so that NaN is caught too
        m_parameters.logger("WARNING: Effective ratio is not positive, using maximum inhop");
        m_inhop = int(maxInhop);
    } else if (ratio > 1.0) {
        double inhop = proposedOuthop / ratio;
        if (inhop < 1.0) {
            m_parameters.logger("WARNING: Extreme ratio yields ideal inhop < 1, results may be suspect");
            m_inhop = 1;
        } else {
            m_inhop = int(round(inhop));
        }
    } else {
        double inhop = std::min(proposedOuthop / ratio, maxInhop);
        m_inhop = int(round(inhop));
    }

    // No std::endl here: the text goes to the logger callback as a
    // plain string, like the other messages in this file
    std::ostringstream str;
    str << "R3StretcherImpl::calculateHop: for effective ratio " << ratio
        << " calculated (typical) inhop of " << m_inhop;
    m_parameters.logger(str.str());
}
// Return the current value of m_timeRatio (the member assigned in
// setTimeRatio()).
double
R3StretcherImpl::getTimeRatio() const
{
return m_timeRatio;
}
// Return the current value of m_pitchScale (the member assigned in
// setPitchScale()).
double
R3StretcherImpl::getPitchScale() const
{
return m_pitchScale;
}
// Report the latency. Currently this always returns 0; the "//!!!"
// marker presumably flags the value as a placeholder still to be
// implemented -- TODO confirm.
size_t
R3StretcherImpl::getLatency() const
{
return 0; //!!!
}
// Return the channel count held in m_parameters.channels.
size_t
R3StretcherImpl::getChannelCount() const
{
return m_parameters.channels;
}
// Currently a no-op: the body holds only a "//!!!" marker, which
// presumably flags the function as not yet implemented -- TODO confirm.
void
R3StretcherImpl::reset()
{
//!!!
}
// Return how many more input samples must be written before the first
// channel's input buffer holds m_guideConfiguration.longestFftSize
// readable samples, or 0 if it already holds at least that many.
size_t
R3StretcherImpl::getSamplesRequired() const
{
    const size_t buffered = m_channelData[0]->inbuf->getReadSpace();

    const int longest = m_guideConfiguration.longestFftSize;
    const size_t wanted = static_cast<size_t>(longest);

    return (buffered < wanted) ? (wanted - buffered) : 0;
}
// Accept a block of input audio and run as much processing as the
// buffers currently allow.
//
// input   - one pointer per channel (indexed 0 .. channels-1), each
//           addressing at least `samples` floats
// samples - number of sample frames supplied per channel
// final   - if true, m_draining is set so that consume() and
//           available() treat the input as finished
//
// If the per-channel input ring buffers cannot take `samples` more
// frames, every channel's buffer is replaced by a resized copy with
// enough room and a warning is logged. The input is then written to
// the buffers and consume() is called.
void
R3StretcherImpl::process(const float *const *input, size_t samples, bool final)
{
    //!!! todo: final

    m_parameters.logger("process called");
    if (final) {
        m_parameters.logger("final = true");
        m_draining = true;
    }

    size_t ws = m_channelData[0]->inbuf->getWriteSpace();
    if (samples > ws) {
        //!!! check this
        m_parameters.logger("R3StretcherImpl::process: WARNING: Forced to increase input buffer size. Either setMaxProcessSize was not properly called or process is being called repeatedly without retrieve.");
        // Grow by exactly the shortfall: current size, less the space
        // still free, plus the incoming sample count
        size_t newSize = m_channelData[0]->inbuf->getSize() - ws + samples;
        for (int c = 0; c < m_parameters.channels; ++c) {
            m_channelData[c]->inbuf =
                std::unique_ptr<RingBuffer<float>>
                (m_channelData[c]->inbuf->resized(newSize));
        }
    }

    for (int c = 0; c < m_parameters.channels; ++c) {
        m_channelData[c]->inbuf->write(input[c], samples);
    }

    consume();
}
// Return the number of samples readable from the first channel's
// output buffer, or -1 when that buffer is empty and m_draining is
// set.
int
R3StretcherImpl::available() const
{
    m_parameters.logger("available called");

    const int readable = int(m_channelData[0]->outbuf->getReadSpace());
    const bool exhausted = (readable == 0) && m_draining;

    return exhausted ? -1 : readable;
}
// Read up to `samples` frames from each channel's output buffer into
// output[channel], returning the smallest count any channel supplied.
//
// Each channel is asked only for the running minimum established by
// the channels before it. A shortfall on any channel after the first
// is logged as a channel imbalance.
size_t
R3StretcherImpl::retrieve(float *const *output, size_t samples) const
{
    m_parameters.logger("retrieve called");

    size_t count = samples;

    for (size_t ch = 0; ch < m_parameters.channels; ++ch) {
        const size_t readNow = m_channelData[ch]->outbuf->read(output[ch], count);
        if (readNow >= count) {
            continue;
        }
        if (ch != 0) {
            m_parameters.logger("R3StretcherImpl::retrieve: WARNING: channel imbalance detected");
        }
        count = readNow;
    }

    return count;
}
void
R3StretcherImpl::consume()
{
2022-05-23 17:59:40 +01:00
double ratio = getEffectiveRatio();
2022-05-23 15:04:34 +01:00
int longest = m_guideConfiguration.longestFftSize;
int classify = m_guideConfiguration.classificationFftSize;
2022-05-23 17:59:40 +01:00
int outhop = m_calculator->calculateSingle(ratio,
1.0 / m_pitchScale,
1.f,
m_inhop,
longest,
longest);
double instantaneousRatio = double(outhop) / double(m_inhop);
2022-05-23 15:04:34 +01:00
while ((m_draining || m_channelData[0]->inbuf->getReadSpace() >= longest) &&
2022-05-23 15:04:34 +01:00
m_channelData[0]->outbuf->getWriteSpace() >= outhop) {
m_parameters.logger("consume looping");
2022-05-23 17:59:40 +01:00
if (m_draining && m_channelData[0]->inbuf->getReadSpace() == 0) {
break;
}
2022-05-23 15:04:34 +01:00
for (int c = 0; c < m_parameters.channels; ++c) {
2022-05-23 17:36:26 +01:00
auto cd = m_channelData.at(c);
2022-05-23 15:04:34 +01:00
auto longestScale = cd->scales.at(longest);
cd->inbuf->peek(longestScale->timeDomainFrame.data(), longest);
2022-05-23 15:04:34 +01:00
for (auto it: cd->scales) {
int fftSize = it.first;
auto scale = it.second;
if (fftSize == longest) continue;
int offset = (longest - fftSize) / 2;
m_scaleData.at(fftSize)->analysisWindow.cut
(longestScale->timeDomainFrame.data() + offset,
scale->timeDomainFrame.data());
}
m_scaleData.at(longest)->analysisWindow.cut
(longestScale->timeDomainFrame.data());
}
for (int c = 0; c < m_parameters.channels; ++c) {
2022-05-23 17:36:26 +01:00
auto cd = m_channelData.at(c);
2022-05-23 15:04:34 +01:00
for (auto it: cd->scales) {
int fftSize = it.first;
auto scale = it.second;
m_scaleData.at(fftSize)->fft.forwardPolar
(scale->timeDomainFrame.data(),
scale->mag.data(),
scale->phase.data());
2022-05-23 17:36:26 +01:00
v_scale(scale->mag.data(), 1.f / float(fftSize),
scale->mag.size());
2022-05-23 15:04:34 +01:00
}
}
for (int c = 0; c < m_parameters.channels; ++c) {
2022-05-23 17:36:26 +01:00
auto cd = m_channelData.at(c);
2022-05-23 15:04:34 +01:00
auto classifyScale = cd->scales.at(classify);
cd->prevSegmentation = cd->segmentation;
cd->segmentation = cd->segmenter->segment(classifyScale->mag.data());
m_troughPicker.findNearestAndNextPeaks
(classifyScale->mag.data(), 3, nullptr,
classifyScale->nextTroughs.data());
2022-05-23 17:59:40 +01:00
m_guide.calculate(instantaneousRatio,
classifyScale->mag.data(),
2022-05-23 15:04:34 +01:00
classifyScale->nextTroughs.data(),
classifyScale->prevMag.data(),
cd->segmentation,
cd->prevSegmentation,
BinSegmenter::Segmentation(), //!!!
cd->guidance);
}
for (auto it : m_channelData[0]->scales) {
int fftSize = it.first;
for (int c = 0; c < m_parameters.channels; ++c) {
2022-05-23 17:36:26 +01:00
auto cd = m_channelData.at(c);
2022-05-23 15:04:34 +01:00
auto classifyScale = cd->scales.at(fftSize);
m_channelAssembly.mag[c] = classifyScale->mag.data();
m_channelAssembly.phase[c] = classifyScale->phase.data();
m_channelAssembly.guidance[c] = &cd->guidance;
m_channelAssembly.outPhase[c] = classifyScale->outPhase.data();
}
m_scaleData.at(fftSize)->guided.advance
(m_channelAssembly.outPhase.data(),
m_channelAssembly.mag.data(),
m_channelAssembly.phase.data(),
m_guideConfiguration,
m_channelAssembly.guidance.data(),
2022-05-23 17:59:40 +01:00
m_inhop,
2022-05-23 15:04:34 +01:00
outhop);
}
for (int c = 0; c < m_parameters.channels; ++c) {
2022-05-23 17:36:26 +01:00
auto cd = m_channelData.at(c);
for (auto it : cd->scales) {
2022-05-23 15:04:34 +01:00
auto scale = it.second;
int bufSize = scale->bufSize;
// copy to prevMag before filtering
v_copy(scale->prevMag.data(), scale->mag.data(), bufSize);
v_copy(scale->prevOutPhase.data(), scale->outPhase.data(), bufSize);
//!!! seems wasteful
2022-05-23 15:04:34 +01:00
for (int i = 0; i < bufSize; ++i) {
scale->phase[i] = princarg(scale->outPhase[i]);
}
}
2022-05-23 17:36:26 +01:00
for (const auto &band : cd->guidance.fftBands) {
int fftSize = band.fftSize;
auto scale = cd->scales.at(fftSize);
auto scaleData = m_scaleData.at(fftSize);
double factor = m_parameters.sampleRate / double(fftSize);
//!!! messy and v slow, but leave it until we've
//!!! discovered whether we need a window accumulator
//!!! (we probably do)
int analysisWindowSize = scaleData->analysisWindow.getSize();
int synthesisWindowSize = scaleData->synthesisWindow.getSize();
int offset = (analysisWindowSize - synthesisWindowSize) / 2;
float winscale = 0.f;
for (int i = 0; i < synthesisWindowSize; ++i) {
winscale += scaleData->analysisWindow.getValue(i + offset) *
scaleData->synthesisWindow.getValue(i);
}
winscale = float(outhop) / winscale;
for (int i = 0; i < fftSize/2 + 1; ++i) {
double f = double(i) * factor;
if (f >= band.f0 && f < band.f1) {
scale->mag[i] *= winscale;
} else {
scale->mag[i] = 0.f;
}
}
}
for (auto it : cd->scales) {
2022-05-23 15:04:34 +01:00
int fftSize = it.first;
auto scale = it.second;
auto scaleData = m_scaleData.at(fftSize);
int bufSize = scale->bufSize;
scaleData->fft.inversePolar(scale->mag.data(),
scale->phase.data(),
scale->timeDomainFrame.data());
2022-05-23 17:36:26 +01:00
int synthesisWindowSize = scaleData->synthesisWindow.getSize();
int offset = (fftSize - synthesisWindowSize) / 2;
scaleData->synthesisWindow.cutAndAdd
(scale->timeDomainFrame.data() + offset,
scale->accumulator.data());
2022-05-23 15:04:34 +01:00
}
v_zero(cd->mixdown.data(), outhop);
for (auto it : cd->scales) {
auto scale = it.second;
auto &acc = scale->accumulator;
v_add(cd->mixdown.data(), acc.data(), outhop);
int n = acc.size() - outhop;
v_move(acc.data(), acc.data() + outhop, n);
v_zero(acc.data() + n, outhop);
}
2022-05-23 17:36:26 +01:00
cd->outbuf->write(cd->mixdown.data(), outhop);
2022-05-23 17:59:40 +01:00
cd->inbuf->skip(m_inhop);
2022-05-23 15:04:34 +01:00
}
}
}
}