forked from Mirrors/freeswitch
202 lines
5.9 KiB
C
202 lines
5.9 KiB
C
/*
|
|
* SpanDSP - a series of DSP components for telephony
|
|
*
|
|
* time_scale_tests.c
|
|
*
|
|
* Written by Steve Underwood <steveu@coppice.org>
|
|
*
|
|
* Copyright (C) 2004 Steve Underwood
|
|
*
|
|
* All rights reserved.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License version 2, as
|
|
* published by the Free Software Foundation.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
*/
|
|
|
|
/*! \page time_scale_tests_page Time scaling tests
|
|
\section time_scale_tests_page_sec_1 What does it do?
|
|
These tests run a speech file through the time scaling routines.
|
|
|
|
\section time_scale_tests_page_sec_2 How are the tests run?
|
|
These tests process a speech file called pre_time_scale.wav. This file should contain
|
|
8000 sample/second 16 bits/sample linear audio. The tests read this file, change the
|
|
time scale of its contents, and write the resulting audio to post_time_scale.wav.
|
|
This file also contains 8000 sample/second 16 bits/sample linear audio.
|
|
*/
|
|
|
|
#if defined(HAVE_CONFIG_H)
|
|
#include "config.h"
|
|
#endif
|
|
|
|
#include <stdlib.h>
|
|
#include <stdio.h>
|
|
#include <unistd.h>
|
|
#include <string.h>
|
|
#include <sndfile.h>
|
|
|
|
#include "spandsp.h"
|
|
|
|
#include "spandsp/private/time_scale.h"
|
|
|
|
#define BLOCK_LEN 160
|
|
|
|
#define IN_FILE_NAME "../test-data/local/short_nb_voice.wav"
|
|
#define OUT_FILE_NAME "time_scale_result.wav"
|
|
|
|
int main(int argc, char *argv[])
|
|
{
|
|
SNDFILE *inhandle;
|
|
SNDFILE *outhandle;
|
|
SF_INFO info;
|
|
int16_t in[BLOCK_LEN];
|
|
int16_t out[5*(BLOCK_LEN + TIME_SCALE_MAX_SAMPLE_RATE/TIME_SCALE_MIN_PITCH)];
|
|
int frames;
|
|
int new_frames;
|
|
int out_frames;
|
|
int count;
|
|
int max;
|
|
int samples_in;
|
|
int samples_out;
|
|
time_scale_state_t state;
|
|
float rate;
|
|
float sample_rate;
|
|
const char *in_file_name;
|
|
bool sweep_rate;
|
|
int opt;
|
|
|
|
rate = 1.8f;
|
|
sweep_rate = false;
|
|
in_file_name = IN_FILE_NAME;
|
|
while ((opt = getopt(argc, argv, "i:r:s")) != -1)
|
|
{
|
|
switch (opt)
|
|
{
|
|
case 'i':
|
|
in_file_name = optarg;
|
|
break;
|
|
case 'r':
|
|
rate = atof(optarg);
|
|
break;
|
|
case 's':
|
|
sweep_rate = true;
|
|
break;
|
|
default:
|
|
//usage();
|
|
exit(2);
|
|
break;
|
|
}
|
|
}
|
|
memset(&info, 0, sizeof(info));
|
|
if ((inhandle = sf_open(in_file_name, SFM_READ, &info)) == NULL)
|
|
{
|
|
printf(" Cannot open audio file '%s'\n", in_file_name);
|
|
exit(2);
|
|
}
|
|
if (info.channels != 1)
|
|
{
|
|
printf(" Unexpected number of channels in audio file '%s'\n", in_file_name);
|
|
exit(2);
|
|
}
|
|
sample_rate = info.samplerate;
|
|
|
|
memset(&info, 0, sizeof(info));
|
|
info.frames = 0;
|
|
info.samplerate = sample_rate;
|
|
info.channels = 1;
|
|
info.format = SF_FORMAT_WAV | SF_FORMAT_PCM_16;
|
|
info.sections = 1;
|
|
info.seekable = 1;
|
|
|
|
if ((outhandle = sf_open(OUT_FILE_NAME, SFM_WRITE, &info)) == NULL)
|
|
{
|
|
fprintf(stderr, " Cannot create audio file '%s'\n", OUT_FILE_NAME);
|
|
exit(2);
|
|
}
|
|
|
|
if ((time_scale_init(&state, (int) sample_rate, rate)) == NULL)
|
|
{
|
|
fprintf(stderr, " Cannot start the time scaler\n");
|
|
exit(2);
|
|
}
|
|
max = time_scale_max_output_len(&state, BLOCK_LEN);
|
|
printf("Rate is %f, longest output block is %d\n", rate, max);
|
|
count = 0;
|
|
samples_in = 0;
|
|
samples_out = 0;
|
|
while ((frames = sf_readf_short(inhandle, in, BLOCK_LEN)))
|
|
{
|
|
samples_in += frames;
|
|
new_frames = time_scale(&state, out, in, frames);
|
|
if (new_frames > max)
|
|
{
|
|
printf("Generated signal has more than the expected maximum samples - %d vs %d\n", new_frames, max);
|
|
printf("Tests failed\n");
|
|
exit(2);
|
|
}
|
|
samples_out += new_frames;
|
|
out_frames = sf_writef_short(outhandle, out, new_frames);
|
|
if (out_frames != new_frames)
|
|
{
|
|
fprintf(stderr, " Error writing audio file\n");
|
|
exit(2);
|
|
}
|
|
if (sweep_rate && ++count > 100)
|
|
{
|
|
if (rate > 0.5f)
|
|
{
|
|
rate -= 0.1f;
|
|
if (rate >= 0.99f && rate <= 1.01f)
|
|
rate -= 0.1f;
|
|
time_scale_init(&state, SAMPLE_RATE, rate);
|
|
max = time_scale_max_output_len(&state, BLOCK_LEN);
|
|
printf("Rate is %f, longest output block is %d\n", rate, max);
|
|
}
|
|
count = 0;
|
|
}
|
|
}
|
|
new_frames = time_scale_flush(&state, out);
|
|
if (new_frames > max)
|
|
{
|
|
printf("Generated signal has more than the expected maximum samples - %d vs %d\n", new_frames, max);
|
|
printf("Tests failed\n");
|
|
exit(2);
|
|
}
|
|
samples_out += new_frames;
|
|
out_frames = sf_writef_short(outhandle, out, new_frames);
|
|
if (out_frames != new_frames)
|
|
{
|
|
fprintf(stderr, " Error writing audio file\n");
|
|
exit(2);
|
|
}
|
|
time_scale_release(&state);
|
|
if ((int) (rate*samples_in) < samples_out - 1 || (int) (rate*samples_in) > samples_out + 1)
|
|
{
|
|
printf("%d samples became %d samples\n", (int) (rate*samples_in), samples_out);
|
|
printf("Tests failed\n");
|
|
exit(2);
|
|
}
|
|
if (sf_close(inhandle))
|
|
{
|
|
printf(" Cannot close audio file '%s'\n", in_file_name);
|
|
exit(2);
|
|
}
|
|
if (sf_close(outhandle))
|
|
{
|
|
printf(" Cannot close audio file '%s'\n", OUT_FILE_NAME);
|
|
exit(2);
|
|
}
|
|
return 0;
|
|
}
|
|
/*- End of function --------------------------------------------------------*/
|
|
/*- End of file ------------------------------------------------------------*/
|