Files
librubberband/src/finer/R3StretcherImpl.h

233 lines
8.2 KiB
C
Raw Normal View History

2022-05-18 17:51:20 +01:00
/* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
/*
Rubber Band Library
An audio time-stretching and pitch-shifting library.
Copyright 2007-2022 Particular Programs Ltd.
This program is free software; you can redistribute it and/or
modify it under the terms of the GNU General Public License as
published by the Free Software Foundation; either version 2 of the
License, or (at your option) any later version. See the file
COPYING included with this distribution for more information.
Alternatively, if you have a valid commercial licence for the
Rubber Band Library obtained by agreement with the copyright
holders, you may redistribute and/or modify it under the terms
described in that licence.
If you wish to distribute code using the Rubber Band Library
under terms other than those of the GNU General Public License,
you must obtain a valid commercial licence before doing so.
*/
#ifndef RUBBERBAND_R3_STRETCHERIMPL_H
#define RUBBERBAND_R3_STRETCHERIMPL_H
#include "BinSegmenter.h"
#include "Guide.h"
#include "Peak.h"
#include "PhaseAdvance.h"

#include "../common/StretchCalculator.h"
#include "../common/FFT.h"
#include "../common/FixedVector.h"
#include "../common/Allocators.h"
#include "../common/Window.h"

#include <cmath>
#include <functional>
#include <iostream>
#include <map>
#include <memory>
#include <string>
#include <utility>
#include <vector>
2022-05-18 17:51:20 +01:00
namespace RubberBand
{
class R3StretcherImpl
{
public:
2022-05-20 16:48:44 +01:00
/**
 * Construction-time settings for the stretcher: sample rate, channel
 * count, and a callback that receives log messages.
 */
struct Parameters {
    double sampleRate;
    int channels;
    std::function<void(const std::string &)> logger;

    /**
     * @param _sampleRate  stored as-is in sampleRate
     * @param _channels    stored as-is in channels
     * @param _log         log callback; defaults to logCerr
     */
    Parameters(double _sampleRate, int _channels,
               std::function<void(const std::string &)> _log = &logCerr) :
        sampleRate(_sampleRate),
        channels(_channels),
        // _log is a by-value sink argument, so move it into place
        // rather than copying the std::function a second time
        logger(std::move(_log)) { }
};
2022-05-23 17:59:40 +01:00
/**
 * Construct a stretcher with the given parameters and initial time
 * ratio and pitch scale.
 *
 * Builds the guide and takes its configuration, then allocates one
 * ChannelData per channel (each holding one ChannelScaleData per FFT
 * size listed in the guide's band limits), one ScaleData per FFT
 * size, and the stretch calculator, and finally calls
 * calculateHop().
 *
 * @param parameters         sample rate, channel count and logger
 * @param initialTimeRatio   initial value of m_timeRatio
 * @param initialPitchScale  initial value of m_pitchScale
 */
R3StretcherImpl(Parameters parameters,
                double initialTimeRatio,
                double initialPitchScale) :
    // Members are initialised in declaration order, so m_parameters
    // is valid by the time the later initialisers read from it; the
    // moved-from argument is not used again.
    m_parameters(std::move(parameters)),
    m_timeRatio(initialTimeRatio),
    m_pitchScale(initialPitchScale),
    m_guide(Guide::Parameters(m_parameters.sampleRate, m_parameters.logger)),
    m_guideConfiguration(m_guide.getConfiguration()),
    m_channelAssembly(m_parameters.channels),
    m_troughPicker(m_guideConfiguration.classificationFftSize / 2 + 1),
    m_inhop(1),
    m_draining(false)
{
    BinSegmenter::Parameters segmenterParameters
        (m_guideConfiguration.classificationFftSize,
         m_parameters.sampleRate);
    BinClassifier::Parameters classifierParameters
        (m_guideConfiguration.classificationFftSize / 2 + 1,
         9, 1, 10, 2.0, 2.0, 1.0e-7);

    const int ringBufferSize = m_guideConfiguration.longestFftSize * 2;

    for (int c = 0; c < m_parameters.channels; ++c) {
        // Populate the channel through a local handle instead of
        // re-indexing m_channelData on every inner iteration
        auto channel = std::make_shared<ChannelData>
            (segmenterParameters, classifierParameters, ringBufferSize);
        for (const auto &band : m_guideConfiguration.fftBandLimits) {
            const int fftSize = band.fftSize;
            channel->scales[fftSize] = std::make_shared<ChannelScaleData>
                (fftSize, m_guideConfiguration.longestFftSize);
        }
        m_channelData.push_back(std::move(channel));
    }

    // Data shared between channels, keyed by FFT size
    for (const auto &band : m_guideConfiguration.fftBandLimits) {
        const int fftSize = band.fftSize;
        GuidedPhaseAdvance::Parameters guidedParameters
            (fftSize, m_parameters.sampleRate, m_parameters.channels,
             m_parameters.logger);
        m_scaleData[fftSize] = std::make_shared<ScaleData>(guidedParameters);
    }

    //!!! the sample rate is held as a double but is passed on here
    //!!! rounded to an int
    m_calculator = std::unique_ptr<StretchCalculator>
        (new StretchCalculator
         (static_cast<int>(std::round(m_parameters.sampleRate)),
          1, false)); // no fixed inputIncrement

    calculateHop();
}
// Empty destructor body: nothing is released by hand here.
~R3StretcherImpl() { }
2022-05-18 17:51:20 +01:00
// Public interface. These are declarations only; the definitions are
// not in this header.
void reset();
// Setters and getters for the time ratio and pitch scale. Presumably
// backed by m_timeRatio and m_pitchScale -- confirm in the
// implementation file.
void setTimeRatio(double ratio);
void setPitchScale(double scale);
double getTimeRatio() const;
double getPitchScale() const;
2022-05-23 15:04:34 +01:00
size_t getSamplesRequired() const;
// NOTE(review): `input` looks like one buffer pointer per channel and
// `final` like an end-of-input flag -- confirm against the definition.
void process(const float *const *input, size_t samples, bool final);
int available() const;
// NOTE(review): declared const although the name suggests it consumes
// buffered output -- confirm that this is intended.
size_t retrieve(float *const *output, size_t samples) const;
size_t getLatency() const;
size_t getChannelCount() const;
2022-05-18 17:51:20 +01:00
protected:
struct ChannelScaleData {
int fftSize;
2022-05-20 15:29:52 +01:00
int bufSize; // size of every freq-domain array here: fftSize/2 + 1
2022-05-23 15:04:34 +01:00
//!!! review later which of these we are actually using!
FixedVector<double> timeDomainFrame;
FixedVector<double> mag;
FixedVector<double> phase;
2022-05-23 15:04:34 +01:00
FixedVector<double> outPhase; //!!! "advanced"?
FixedVector<int> nextTroughs; //!!! not used in every scale
FixedVector<double> prevMag; //!!! not used in every scale
2022-05-20 15:29:52 +01:00
FixedVector<double> prevOutPhase;
FixedVector<double> accumulator;
2022-05-18 17:51:20 +01:00
ChannelScaleData(int _fftSize, int _longestFftSize) :
2022-05-23 15:04:34 +01:00
fftSize(_fftSize),
bufSize(fftSize/2 + 1),
timeDomainFrame(fftSize, 0.f),
mag(bufSize, 0.f),
phase(bufSize, 0.f),
outPhase(bufSize, 0.f),
nextTroughs(bufSize, 0),
prevMag(bufSize, 0.f),
prevOutPhase(bufSize, 0.f),
accumulator(_longestFftSize, 0.f)
2022-05-20 15:29:52 +01:00
{ }
2022-05-18 17:51:20 +01:00
private:
ChannelScaleData(const ChannelScaleData &) =delete;
ChannelScaleData &operator=(const ChannelScaleData &) =delete;
};
2022-05-19 17:28:38 +01:00
2022-05-18 17:51:20 +01:00
struct ChannelData {
std::map<int, std::shared_ptr<ChannelScaleData>> scales;
2022-05-19 09:16:13 +01:00
std::unique_ptr<BinSegmenter> segmenter;
BinSegmenter::Segmentation segmentation;
BinSegmenter::Segmentation prevSegmentation;
BinSegmenter::Segmentation nextSegmentation;
2022-05-19 16:31:21 +01:00
Guide::Guidance guidance;
FixedVector<double> mixdown;
2022-05-23 15:04:34 +01:00
std::unique_ptr<RingBuffer<float>> inbuf;
std::unique_ptr<RingBuffer<float>> outbuf;
2022-05-20 16:48:44 +01:00
ChannelData(BinSegmenter::Parameters segmenterParameters,
BinClassifier::Parameters classifierParameters,
int ringBufferSize) :
scales(),
segmenter(new BinSegmenter(segmenterParameters,
classifierParameters)),
segmentation(), prevSegmentation(), nextSegmentation(),
mixdown(ringBufferSize, 0.f), //!!! could be shorter (bound is the max fft size I think)
2022-05-23 15:04:34 +01:00
inbuf(new RingBuffer<float>(ringBufferSize)),
outbuf(new RingBuffer<float>(ringBufferSize)) { }
};
/**
 * Vectors of bare pointers, used to package container data from
 * different channels into arguments for PhaseAdvance. One slot per
 * channel in each vector; every slot starts out null.
 */
struct ChannelAssembly {
    FixedVector<double *> mag;
    FixedVector<double *> phase;
    FixedVector<Guide::Guidance *> guidance;
    FixedVector<double *> outPhase;

    /** @param channels  number of slots in each vector */
    ChannelAssembly(int channels) :
        mag(channels, nullptr),
        phase(channels, nullptr),
        guidance(channels, nullptr),
        outPhase(channels, nullptr)
    { }
};
2022-05-20 15:29:52 +01:00
2022-05-23 15:04:34 +01:00
struct ScaleData {
FFT fft;
Window<double> analysisWindow;
Window<double> synthesisWindow;
2022-05-23 15:04:34 +01:00
GuidedPhaseAdvance guided;
ScaleData(GuidedPhaseAdvance::Parameters guidedParameters) :
fft(guidedParameters.fftSize),
analysisWindow(HannWindow, guidedParameters.fftSize),
synthesisWindow(HannWindow, guidedParameters.fftSize/2),
guided(guidedParameters) { }
};
2022-05-20 16:48:44 +01:00
// Data members. They are initialised in declaration order, and the
// constructor's initialiser list depends on that order:
// m_guideConfiguration is built from m_guide, and m_channelAssembly
// and m_troughPicker read m_parameters and m_guideConfiguration.
Parameters m_parameters;
2022-05-20 15:29:52 +01:00
double m_timeRatio;
double m_pitchScale;
2022-05-23 17:59:40 +01:00
2022-05-20 16:48:44 +01:00
// One entry per channel, appended by the constructor
std::vector<std::shared_ptr<ChannelData>> m_channelData;
2022-05-23 15:04:34 +01:00
// Keyed by FFT size; one entry per band in the guide configuration
std::map<int, std::shared_ptr<ScaleData>> m_scaleData;
2022-05-19 17:28:38 +01:00
Guide m_guide;
// Copy of m_guide.getConfiguration(), taken at construction
Guide::Configuration m_guideConfiguration;
2022-05-23 15:04:34 +01:00
ChannelAssembly m_channelAssembly;
// Constructed with classificationFftSize / 2 + 1
Peak<double, std::less<double>> m_troughPicker;
2022-05-23 17:59:40 +01:00
// Created in the constructor body
std::unique_ptr<StretchCalculator> m_calculator;
// Starts at 1; presumably updated by calculateHop() -- confirm
int m_inhop;
// Starts false
bool m_draining;
2022-05-20 16:48:44 +01:00
2022-05-23 15:04:34 +01:00
// Internal helpers, defined out of line
void consume();
2022-05-23 17:59:40 +01:00
void calculateHop();
/** Return the product of the current time ratio and pitch scale. */
double getEffectiveRatio() const {
    const double effectiveRatio = m_timeRatio * m_pitchScale;
    return effectiveRatio;
}
2022-05-23 15:04:34 +01:00
2022-05-20 16:48:44 +01:00
/**
 * Default log callback: write the message to std::cerr on a line of
 * its own, prefixed with "RubberBandStretcher: ".
 */
static void logCerr(const std::string &message) {
    std::ostream &sink = std::cerr;
    sink << "RubberBandStretcher: " << message;
    sink << std::endl;
}
2022-05-18 17:51:20 +01:00
};
}
#endif