123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201 |
- /*
- * SpanDSP - a series of DSP components for telephony
- *
- * time_scale_tests.c
- *
- * Written by Steve Underwood <steveu@coppice.org>
- *
- * Copyright (C) 2004 Steve Underwood
- *
- * All rights reserved.
- *
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License version 2, as
- * published by the Free Software Foundation.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with this program; if not, write to the Free Software
- * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
- */
- /*! \page time_scale_tests_page Time scaling tests
- \section time_scale_tests_page_sec_1 What does it do?
- These tests run a speech file through the time scaling routines.
- \section time_scale_tests_page_sec_2 How are the tests run?
- These tests process a speech file called pre_time_scale.wav. This file should contain
- 8000 sample/second 16 bits/sample linear audio. The tests read this file, change the
- time scale of its contents, and write the resulting audio to post_time_scale.wav.
- This file also contains 8000 sample/second 16 bits/sample linear audio.
- */
- #if defined(HAVE_CONFIG_H)
- #include "config.h"
- #endif
- #include <stdlib.h>
- #include <stdio.h>
- #include <unistd.h>
- #include <string.h>
- #include <sndfile.h>
- #include "spandsp.h"
- #include "spandsp/private/time_scale.h"
- #define BLOCK_LEN 160
- #define IN_FILE_NAME "../test-data/local/short_nb_voice.wav"
- #define OUT_FILE_NAME "time_scale_result.wav"
- int main(int argc, char *argv[])
- {
- SNDFILE *inhandle;
- SNDFILE *outhandle;
- SF_INFO info;
- int16_t in[BLOCK_LEN];
- int16_t out[5*(BLOCK_LEN + TIME_SCALE_MAX_SAMPLE_RATE/TIME_SCALE_MIN_PITCH)];
- int frames;
- int new_frames;
- int out_frames;
- int count;
- int max;
- int samples_in;
- int samples_out;
- time_scale_state_t state;
- float rate;
- float sample_rate;
- const char *in_file_name;
- bool sweep_rate;
- int opt;
- rate = 1.8f;
- sweep_rate = false;
- in_file_name = IN_FILE_NAME;
- while ((opt = getopt(argc, argv, "i:r:s")) != -1)
- {
- switch (opt)
- {
- case 'i':
- in_file_name = optarg;
- break;
- case 'r':
- rate = atof(optarg);
- break;
- case 's':
- sweep_rate = true;
- break;
- default:
- //usage();
- exit(2);
- break;
- }
- }
- memset(&info, 0, sizeof(info));
- if ((inhandle = sf_open(in_file_name, SFM_READ, &info)) == NULL)
- {
- printf(" Cannot open audio file '%s'\n", in_file_name);
- exit(2);
- }
- if (info.channels != 1)
- {
- printf(" Unexpected number of channels in audio file '%s'\n", in_file_name);
- exit(2);
- }
- sample_rate = info.samplerate;
- memset(&info, 0, sizeof(info));
- info.frames = 0;
- info.samplerate = sample_rate;
- info.channels = 1;
- info.format = SF_FORMAT_WAV | SF_FORMAT_PCM_16;
- info.sections = 1;
- info.seekable = 1;
- if ((outhandle = sf_open(OUT_FILE_NAME, SFM_WRITE, &info)) == NULL)
- {
- fprintf(stderr, " Cannot create audio file '%s'\n", OUT_FILE_NAME);
- exit(2);
- }
- if ((time_scale_init(&state, (int) sample_rate, rate)) == NULL)
- {
- fprintf(stderr, " Cannot start the time scaler\n");
- exit(2);
- }
- max = time_scale_max_output_len(&state, BLOCK_LEN);
- printf("Rate is %f, longest output block is %d\n", rate, max);
- count = 0;
- samples_in = 0;
- samples_out = 0;
- while ((frames = sf_readf_short(inhandle, in, BLOCK_LEN)))
- {
- samples_in += frames;
- new_frames = time_scale(&state, out, in, frames);
- if (new_frames > max)
- {
- printf("Generated signal has more than the expected maximum samples - %d vs %d\n", new_frames, max);
- printf("Tests failed\n");
- exit(2);
- }
- samples_out += new_frames;
- out_frames = sf_writef_short(outhandle, out, new_frames);
- if (out_frames != new_frames)
- {
- fprintf(stderr, " Error writing audio file\n");
- exit(2);
- }
- if (sweep_rate && ++count > 100)
- {
- if (rate > 0.5f)
- {
- rate -= 0.1f;
- if (rate >= 0.99f && rate <= 1.01f)
- rate -= 0.1f;
- time_scale_init(&state, SAMPLE_RATE, rate);
- max = time_scale_max_output_len(&state, BLOCK_LEN);
- printf("Rate is %f, longest output block is %d\n", rate, max);
- }
- count = 0;
- }
- }
- new_frames = time_scale_flush(&state, out);
- if (new_frames > max)
- {
- printf("Generated signal has more than the expected maximum samples - %d vs %d\n", new_frames, max);
- printf("Tests failed\n");
- exit(2);
- }
- samples_out += new_frames;
- out_frames = sf_writef_short(outhandle, out, new_frames);
- if (out_frames != new_frames)
- {
- fprintf(stderr, " Error writing audio file\n");
- exit(2);
- }
- time_scale_release(&state);
- if ((int) (rate*samples_in) < samples_out - 1 || (int) (rate*samples_in) > samples_out + 1)
- {
- printf("%d samples became %d samples\n", (int) (rate*samples_in), samples_out);
- printf("Tests failed\n");
- exit(2);
- }
- if (sf_close(inhandle))
- {
- printf(" Cannot close audio file '%s'\n", in_file_name);
- exit(2);
- }
- if (sf_close(outhandle))
- {
- printf(" Cannot close audio file '%s'\n", OUT_FILE_NAME);
- exit(2);
- }
- return 0;
- }
- /*- End of function --------------------------------------------------------*/
- /*- End of file ------------------------------------------------------------*/
|