doxygen/Stretcher_8cc_source.html

 //-----------------------------------------------------------------------------

 //

 //  $Id: Stretcher.cc 878 2014-11-23 04:51:23Z weegreenblobbie $

 //

 //  Nsound is a C++ library and Python module for audio synthesis featuring

 //  dynamic digital filters. Nsound lets you easily shape waveforms and write

 //  to disk or plot them. Nsound aims to be as powerful as Csound but easy to

 //  use.

 //

 //  Copyright (c) 2008 to Present Nick Hilton

 //

 //  weegreenblobbie_yahoo_com (replace '_' with '@' and '.')

 //

 //-----------------------------------------------------------------------------


 //-----------------------------------------------------------------------------

 //

 //  This program is free software; you can redistribute it and/or modify

 //  it under the terms of the GNU General Public License as published by

 //  the Free Software Foundation; either version 2 of the License, or

 //  (at your option) any later version.

 //

 //  This program is distributed in the hope that it will be useful,

 //  but WITHOUT ANY WARRANTY; without even the implied warranty of

 //  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

 //  GNU Library General Public License for more details.

 //

 //  You should have received a copy of the GNU General Public License

 //  along with this program; if not, write to the Free Software

 //  Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.

 //

 //-----------------------------------------------------------------------------


 #include <Nsound/AudioStream.h>

 #include <Nsound/Buffer.h>

 #include <Nsound/Sine.h>

 #include <Nsound/Stretcher.h>


 #include <cstdio>

 #include <algorithm>

 #include <cmath>

 #include <cstdlib>

 #include <deque>

 #include <set>


 using namespace Nsound;


 using std::cerr;

 using std::cout;

 using std::endl;


 //-----------------------------------------------------------------------------

 Stretcher::

 Stretcher(

     const float64 & sample_rate,

     const float64 & window_size_seconds,

     const float64 & max_delta_window)

     :

     frames_(NULL),

     sample_rate_(sample_rate),

     window_(NULL),

     window_length_(0),

     max_delta_(0),

     show_progress_(false)

 {

     frames_ = new Buffer(1024);

     window_ = new Buffer(1024);


     Sine sin(sample_rate);

     *window_ = sin.drawWindowHanning(window_size_seconds);

     window_length_ = window_->getLength();

     max_delta_ = uint32(float64(window_length_) * max_delta_window);

 }


 //-----------------------------------------------------------------------------

 Stretcher::

 Stretcher(const Stretcher & copy)

     :

     frames_(NULL),

     sample_rate_(copy.sample_rate_),

     window_(NULL),

     window_length_(copy.window_length_),

     max_delta_(copy.max_delta_),

     show_progress_(copy.show_progress_)

 {

     frames_ = new Buffer(1024);

     window_ = new Buffer(window_length_);


     *this = copy;

 }


 //-----------------------------------------------------------------------------

 Stretcher::

 ~Stretcher()

 {

     delete frames_;

     delete window_;

 }


 //-----------------------------------------------------------------------------

 Stretcher &

 Stretcher::

 operator=(const Stretcher & rhs)

 {

     if(this == & rhs) return *this;


     sample_rate_   = rhs.sample_rate_;

     window_length_ = rhs.window_length_;

     max_delta_     = rhs.max_delta_;

     *frames_       = *rhs.frames_;

     *window_       = *rhs.window_;

     show_progress_ = rhs.show_progress_;


     return *this;

 }


 void

 Stretcher::

 analyize(const Buffer & input, const float64 & f)

 {

     Buffer factor(1);

     factor << f;


     analyize(input, factor);

 }


 void

 Stretcher::

 analyize(const Buffer & input, const Buffer & factor)

 {

     // Always calculate time shift.


     Buffer::const_circular_iterator ifactor = factor.cbegin();


     uint32 tau = static_cast<uint32>(window_length_ / 2.0 / ::fabs(*ifactor));


     uint32 input_length = input.getLength();


     *frames_ = Buffer(256);


     uint32 i = 0;

     while(i < input_length - window_length_)

     {

         *frames_ << i;

         i += tau;


         ifactor += tau;


         tau = static_cast<uint32>(window_length_ / 2.0 / ::fabs(*ifactor));

     }


     uint32 n_frames = frames_->getLength();


     uint32 mod_frames = n_frames / 100;


     if(n_frames < 100) mod_frames = n_frames;


     if(show_progress_)

     {

         #ifdef NSOUND_CUDA


             printf("Using CUDA\n");


         #else


             #ifdef NSOUND_OPENMP

                 #pragma omp parallel

                 {

                     if(0 == omp_get_thread_num())

                     {

                         printf("Using OpenMP with %d threads\n",

                             omp_get_num_threads());

                         fflush(stdout);

                     }

                 }

             #endif


         #endif


         printf("Analyizing %3.0f%%", 0.0);

         fflush(stdout);

     }


     for(uint32 j = 0; j < n_frames-1; ++j)

     {

         if(show_progress_ && j % mod_frames == 0)

         {

             printf("\b\b\b\b");

             printf("%3.0f%%", 100.0 * float64(j) / float64(n_frames));

             fflush(stdout);

         }


         (*frames_)[j] = searchForBestMatch(

             input,

             uint32((*frames_)[j]),

             uint32((*frames_)[j+1]));

     }


     if(show_progress_)

     {

         printf("\b\b\b\b");

         printf("%3.0f%%\n", 100.0);

         fflush(stdout);

     }

 }


 uint32

 Stretcher::

 searchForBestMatch(

     const Buffer & input,

     uint32 source_index,

     uint32 search_index) const

 {

     // Nick's original score function

     #if 1

         Buffer b_source = input.subbuffer(source_index, window_length_);


         uint32 t = 0;

         float64 min_score = 1.0e100;


         #ifdef NSOUND_OPENMP

             #pragma omp parallel for shared(t, min_score)

         #endif

         for(uint32 i = 0; i < max_delta_; ++i)

         {

             Buffer b_test = input.subbuffer(search_index + i, window_length_)

                           - b_source;


             b_test *= b_test;


             float64 score = b_test.getSum();


             if(score < min_score)

             {

                 min_score = score;

                 t = i;

             }

         }

     #endif


     #if 0

         // Maximizing fft phase information.


         FFTransform transform(100.0); // Sample rate here won't be used.


         Buffer b_source = input.subbuffer(source_index, window_length_);


         FFTChunkVector vec = transform.fft(b_source, window_length_);


         Buffer source_fft = vec[0].getPhase();


         uint32 t = 0;

         float64 min_score = 1.0e100;

         for(uint32 i = 0; i < max_delta_; ++i)

         {

             Buffer b_test = input.subbuffer(search_index + i, window_length_);


             FFTChunkVector vec = transform.fft(b_test, window_length_);


             Buffer test_fft = vec[0].getPhase();


             Buffer delta = source_fft - test_fft;


             delta *= delta;


             float64 score = delta.getSum();


             if(score < min_score)

             {

                 min_score = score;

                 t = i;

             }

         }

     #endif


     return t + search_index;

 }


 Buffer

 Stretcher::

 overlapAdd(const Buffer & input) const

 {

     Sine sin(sample_rate_);


     float64 half_window_seconds = (window_length_ / 2) / sample_rate_;


     uint32 half_length = window_length_ / 2;


     Buffer window_start = sin.drawLine(half_window_seconds, 1.0, 1.0)

                        << window_->subbuffer(half_length, half_length);


     Buffer window_finish = window_start.getReverse();


     Buffer output = input.subbuffer(0, window_length_) * (*window_);


     uint32 n_frames = frames_->getLength();


     uint32 mod_frames = n_frames / 100;


     if(n_frames < 100) mod_frames = n_frames;


     if(show_progress_)

     {

         printf("Creating output %3.0f%%", 0.0);

         fflush(stdout);

     }


     for(uint32 i = 1; i < n_frames; ++i)

     {

         if(show_progress_ && i % mod_frames == 0)

         {

             printf("\b\b\b\b");

             printf("%3.0f%%", 100.0 * float64(i) / float64(n_frames));

             fflush(stdout);

         }


         uint32 frame = uint32((*frames_)[i]);


         Buffer next_window = input.subbuffer(frame, window_length_)

                            * (*window_);


         // overlap & add

         output.add(next_window, i * half_length);

     }


     if(show_progress_)

     {

         printf("\b\b\b\b");

         printf("%3.0f%%\n", 100.0);

         fflush(stdout);

     }


     return output;

 }


 AudioStream

 Stretcher::

 pitchShift(const AudioStream & x, const float64 & factor)

 {

     // Prepare for time shift.

     analyize(x.getMono()[0], factor);


     AudioStream y(x.getSampleRate(), x.getNChannels());


     for(uint32 i = 0; i < x.getNChannels(); ++i)

     {

         y[i] = overlapAdd(x[i]);

     }


     return y.getResample(1.0/factor);

 }


 AudioStream

 Stretcher::

 pitchShift(const AudioStream & x, const Buffer & factor)

 {

     // Prepare for time shift.

     analyize(x.getMono()[0], factor);


     AudioStream y(x.getSampleRate(), x.getNChannels());


     for(uint32 i = 0; i < x.getNChannels(); ++i)

     {

         y[i] = overlapAdd(x[i]);

     }


     return y.getSpeedUp(factor);

 }


 Buffer

 Stretcher::

 pitchShift(const Buffer & x, const float64 & factor)

 {

     // Prepare for time shift.

     analyize(x, factor);


     Buffer stretched = overlapAdd(x);


     return stretched.getResample(1.0/factor);

 }


 Buffer

 Stretcher::

 pitchShift(const Buffer & x, const Buffer & factor)

 {

     // Prepare for time shift.

     analyize(x, factor);


     Buffer stretched = overlapAdd(x);


     return stretched.getSpeedUp(factor);

 }


 AudioStream

 Stretcher::

 timeShift(const AudioStream & x, const float64 & factor)

 {

     // Prepare for time shift.

     analyize(x.getMono()[0], factor);


     AudioStream y(x.getSampleRate(), x.getNChannels());


     for(uint32 i = 0; i < x.getNChannels(); ++i)

     {

         y[i] = overlapAdd(x[i]);

     }


     return y;

 }


 AudioStream

 Stretcher::

 timeShift(const AudioStream & x, const Buffer & factor)

 {

     // Prepare for time shift.

     analyize(x.getMono()[0], factor);


     AudioStream y(x.getSampleRate(), x.getNChannels());


     for(uint32 i = 0; i < x.getNChannels(); ++i)

     {

         y[i] = overlapAdd(x[i]);

     }


     return y;

 }


 Buffer

 Stretcher::

 timeShift(const Buffer & x, const float64 & factor)

 {

     // Prepare for time shift.

     analyize(x, factor);


     Buffer stretched = overlapAdd(x);


     return stretched;

 }


 Buffer

 Stretcher::

 timeShift(const Buffer & x, const Buffer & factor)

 {

     // Prepare for time shift.

     analyize(x, factor);


     Buffer stretched = overlapAdd(x);


     return stretched;

 }


Nsound::Buffer::subbuffer
Buffer subbuffer(uint32 start_index, uint32 n_samples=0) const
Slice the Buffer.
Definition: Buffer.cc:2073

Nsound::uint32
unsigned int uint32
Definition: Nsound.h:153

Nsound::Buffer::getSpeedUp
Buffer getSpeedUp(float64 step_size) const
Resamples a copy of this Buffer by the step_size, no interpolation.
Definition: Buffer.h:1707

Nsound::AudioStream::getSampleRate
float64 getSampleRate() const
Returns the sample rate of the stream.
Definition: AudioStream.h:217

Nsound::Stretcher::window_
Buffer * window_
Definition: Stretcher.h:119

Nsound::Stretcher::pitchShift
AudioStream pitchShift(const AudioStream &x, const float64 &factor)
Definition: Stretcher.cc:338

Nsound::Stretcher::searchForBestMatch
uint32 searchForBestMatch(const Buffer &input, uint32 source_index, uint32 search_index) const
Definition: Stretcher.cc:209

Nsound::Stretcher
WSOLA.
Definition: Stretcher.h:49

Nsound::Stretcher::operator=
Stretcher & operator=(const Stretcher &rhs)
Assignment.
Definition: Stretcher.cc:103

Nsound::float64
double float64
Definition: Nsound.h:146

Nsound::Stretcher::overlapAdd
Buffer overlapAdd(const Buffer &input) const
Definition: Stretcher.cc:281

Nsound::Buffer::cbegin
circular_iterator cbegin()
Retruns the itreator at the start of the Buffer.
Definition: Buffer.h:318

Nsound::Stretcher::~Stretcher
virtual ~Stretcher()
Destructor.
Definition: Stretcher.cc:94

Nsound::Stretcher::window_length_
uint32 window_length_
Definition: Stretcher.h:120

Nsound::Generator::drawWindowHanning
Buffer drawWindowHanning(const float64 &duration) const
Draws a Hanning window.
Definition: Generator.cc:819

Nsound::Buffer::getLength
uint32 getLength() const
Returns the number of samples in the Buffer.
Definition: Buffer.h:587

Stretcher.h

Nsound::AudioStream::getNChannels
uint32 getNChannels(void) const
Returns the number of audio channels in the stream.
Definition: AudioStream.h:212

Nsound::Stretcher::frames_
Buffer * frames_
Definition: Stretcher.h:117

Sine.h

Nsound::const_circular_iterator
Definition: CircularIterators.h:212

Nsound::AudioStream
Definition: AudioStream.h:52

Nsound::Stretcher::show_progress_
boolean show_progress_
Definition: Stretcher.h:122

Nsound::FFTransform
A Class that performes the Fast Fouier Transfrom on a Buffer.
Definition: FFTransform.h:57

Nsound::Stretcher::timeShift
AudioStream timeShift(const AudioStream &x, const float64 &factor)
Definition: Stretcher.cc:396

Nsound::Buffer::getSum
float64 getSum() const
Returns the sum of all samples.
Definition: Buffer.cc:1118

Nsound::Buffer
A Buffer for storing audio samples.
Definition: Buffer.h:60

Nsound::Stretcher::sample_rate_
float64 sample_rate_
Definition: Stretcher.h:118

Nsound::FFTransform::fft
Buffer fft(const Buffer &time_domain) const
Transforms the time_domain signal and calculates the FFT.
Definition: FFTransform.cc:50

Nsound::Buffer::getResample
Buffer getResample(float64 factor, const uint32 N=10, float64 beta=5.0) const
Resamples a copy of this Buffer using discrete-time resampling.
Definition: Buffer.cc:1607

Nsound::AudioStream::getMono
AudioStream getMono() const
Collapses all channels into one Buffer making it mono.
Definition: AudioStream.cc:265

Nsound::Stretcher::analyize
void analyize(const Buffer &input, const float64 &factor)
Definition: Stretcher.cc:119

Nsound::Stretcher::Stretcher
Stretcher(const float64 &sample_rate, const float64 &window_size_seconds=0.08, const float64 &max_delta_window=0.25)
Default Constructor.
Definition: Stretcher.cc:54

Nsound::Generator::drawLine
Buffer drawLine(const float64 &duration, const float64 &amplitude_start, const float64 &amplitude_finish) const
This method draws a linear line beteween 2 points.
Definition: Generator.cc:464

Nsound::Buffer::add
void add(const Buffer &buffer, uint32 offset=0, uint32 n_samples=0)
This method adds buffer to *this.
Definition: Buffer.cc:225

Buffer.h

Nsound::Buffer::getReverse
Buffer getReverse() const
Reverses the samples in a copy of this Buffer.
Definition: Buffer.h:1558

AudioStream.h

Nsound::Stretcher::max_delta_
uint32 max_delta_
Definition: Stretcher.h:121

Nsound::FFTChunkVector
std::vector< FFTChunk > FFTChunkVector
Definition: FFTChunk.h:119

Nsound::Sine
DOXME.
Definition: Sine.h:43