summary | refs | log | tree | commit | diff
path: root/src/io/source_wavread.c
diff options
context:
space:
mode:
Diffstat (limited to 'src/io/source_wavread.c')
-rw-r--r-- src/io/source_wavread.c 411
1 files changed, 411 insertions, 0 deletions
diff --git a/src/io/source_wavread.c b/src/io/source_wavread.c
new file mode 100644
index 0000000..d1b1f3a
--- /dev/null
+++ b/src/io/source_wavread.c
@@ -0,0 +1,411 @@
+/*
+ Copyright (C) 2014 Paul Brossier <piem@aubio.org>
+
+ This file is part of aubio.
+
+ aubio is free software: you can redistribute it and/or modify
+ it under the terms of the GNU General Public License as published by
+ the Free Software Foundation, either version 3 of the License, or
+ (at your option) any later version.
+
+ aubio is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with aubio. If not, see <http://www.gnu.org/licenses/>.
+
+*/
+
+#include "config.h"
+
+#ifdef HAVE_WAVREAD
+
+#include "aubio_priv.h"
+#include "fvec.h"
+#include "fmat.h"
+#include "source_wavread.h"
+
+#include <errno.h>
+
+/* number of frames fetched from the file each time the internal buffers are
+ * refilled; also the length of the decoded output matrix */
+#define AUBIO_WAVREAD_BUFSIZE 1024
+
+/* scale a 16-bit integer sample by 1 / 32768; the argument and the whole
+ * expansion are parenthesized so that expressions such as
+ * SHORT_TO_FLOAT(a + b) expand as intended */
+#define SHORT_TO_FLOAT(x) ((smpl_t)((x) * 3.0517578125e-05))
+
+/* State of one open WAV reader: the parameters requested by the caller, the
+ * values parsed from the file header, and the buffers used while decoding. */
+struct _aubio_source_wavread_t {
+ // number of frames produced by each call to the _do / _do_multi functions
+ uint_t hop_size;
+ // samplerate requested at creation, or the file's own when 0 was requested
+ uint_t samplerate;
+ // NOTE(review): never assigned in the code shown in this file
+ uint_t channels;
+
+ // some data about the file
+ // private copy of the path passed at creation, used in error messages
+ char_t *path;
+ // SampleRate field of the "fmt " sub-chunk
+ uint_t input_samplerate;
+ // NumChannels field of the "fmt " sub-chunk
+ uint_t input_channels;
+
+ // internal stuff
+ // stream opened in "rb" mode; set back to NULL once closed
+ FILE *fid;
+
+ // number of frames obtained by the last buffer refill
+ uint_t read_samples;
+ // BlockAlign header field: size of one frame (all channels), in bytes
+ uint_t blockalign;
+ // BitsPerSample header field
+ uint_t bitspersample;
+ // index in `output` of the next frame to hand out
+ uint_t read_index;
+ // set to 1 when a refill returned no frame at all
+ uint_t eof;
+
+ // size of the "data" sub-chunk divided by blockalign, i.e. a frame count
+ uint_t duration;
+
+ // byte offset of the first audio frame, used as the origin when seeking
+ size_t seek_start;
+
+ // raw bytes as read from the file: AUBIO_WAVREAD_BUFSIZE blocks of
+ // blockalign bytes
+ unsigned char *short_output;
+ // decoded samples: input_channels rows of AUBIO_WAVREAD_BUFSIZE values
+ fmat_t *output;
+};
+
+/* Decode an unsigned integer stored least significant byte first.
+ *
+ * buf: bytes to decode
+ * length: number of bytes to use; callers in this file pass 2 or 4, and it
+ *   must not exceed sizeof(unsigned int)
+ *
+ * Returns the decoded value, or 0 when length is 0.
+ */
+unsigned int read_little_endian (unsigned char *buf, unsigned int length);
+unsigned int read_little_endian (unsigned char *buf, unsigned int length) {
+  unsigned int i, ret = 0;
+  for (i = 0; i < length; i++) {
+    // widen before shifting: a bare `buf[i] << 24` is computed as a signed
+    // int and is undefined whenever the top bit of that byte is set
+    ret |= (unsigned int)buf[i] << (i * 8);
+  }
+  return ret;
+}
+
+/* Open a RIFF/WAVE file for reading.
+ *
+ * Only the canonical 44-byte layout is understood: a RIFF/WAVE header, a
+ * 16-byte PCM "fmt " sub-chunk, immediately followed by the "data" sub-chunk.
+ * The header is validated, then the decoding buffers are allocated.
+ *
+ * path: file to open
+ * samplerate: expected samplerate in Hz, or 0 to adopt the one found in the
+ *   file; no resampling is done, so any other mismatch is an error
+ * hop_size: number of frames delivered by each read call, must be > 0
+ *
+ * Returns the new object, or NULL after reporting the reason with AUBIO_ERR.
+ */
+aubio_source_wavread_t * new_aubio_source_wavread(const char_t * path, uint_t samplerate, uint_t hop_size) {
+  aubio_source_wavread_t * s = AUBIO_NEW(aubio_source_wavread_t);
+  size_t bytes_read = 0, bytes_expected = 44;
+  size_t path_len = 0;
+  // zeroed so that a short fread never leaves indeterminate bytes to parse
+  unsigned char buf[5] = {0};
+  unsigned int format, channels, sr, byterate, blockalign, duration, bitspersample;
+
+  if (s == NULL) {
+    return NULL;
+  }
+  // NOTE(review): the cleanup at `beach` tests s->fid, s->path and both
+  // buffers, so every early exit relies on AUBIO_NEW returning zeroed
+  // storage -- confirm in aubio_priv.h
+
+  if (path == NULL) {
+    AUBIO_ERR("source_wavread: Aborted opening null path\n");
+    goto beach;
+  }
+  if ((sint_t)samplerate < 0) {
+    AUBIO_ERR("source_wavread: Can not open %s with samplerate %d\n", path, samplerate);
+    goto beach;
+  }
+  if ((sint_t)hop_size <= 0) {
+    AUBIO_ERR("source_wavread: Can not open %s with hop_size %d\n", path, hop_size);
+    goto beach;
+  }
+
+  // keep a private copy of the path; terminate it explicitly, since strncpy
+  // does not when the source is at least as long as the requested count
+  path_len = strnlen(path, PATH_MAX);
+  s->path = AUBIO_ARRAY(char_t, path_len + 1);
+  if (s->path == NULL) {
+    AUBIO_ERR("source_wavread: could not allocate memory to open %s\n", path);
+    goto beach;
+  }
+  strncpy(s->path, path, path_len);
+  s->path[path_len] = '\0';
+
+  s->samplerate = samplerate;
+  s->hop_size = hop_size;
+
+  s->fid = fopen((const char *)path, "rb");
+  if (!s->fid) {
+    AUBIO_ERR("source_wavread: Failed opening %s (System error: %s)\n", s->path, strerror(errno));
+    goto beach;
+  }
+
+  // ChunkID
+  bytes_read += fread(buf, 1, 4, s->fid);
+  buf[4] = '\0';
+  if ( strcmp((const char *)buf, "RIFF") != 0 ) {
+    AUBIO_ERR("source_wavread: could not find RIFF header in %s\n", s->path);
+    goto beach;
+  }
+
+  // ChunkSize (not used)
+  bytes_read += fread(buf, 1, 4, s->fid);
+
+  // Format
+  bytes_read += fread(buf, 1, 4, s->fid);
+  buf[4] = '\0';
+  if ( strcmp((const char *)buf, "WAVE") != 0 ) {
+    AUBIO_ERR("source_wavread: wrong format in RIFF header in %s\n", s->path);
+    goto beach;
+  }
+
+  // Subchunk1ID
+  bytes_read += fread(buf, 1, 4, s->fid);
+  buf[4] = '\0';
+  if ( strcmp((const char *)buf, "fmt ") != 0 ) {
+    AUBIO_ERR("source_wavread: fmt RIFF header in %s\n", s->path);
+    goto beach;
+  }
+
+  // Subchunk1Size: only the 16-byte PCM layout is supported; a value of 16
+  // also implies that the three upper bytes of the field are zero
+  bytes_read += fread(buf, 1, 4, s->fid);
+  format = read_little_endian(buf, 4);
+  if ( format != 16 ) {
+    // TODO accept format 18
+    AUBIO_ERR("source_wavread: file %s is not encoded with PCM\n", s->path);
+    goto beach;
+  }
+
+  // AudioFormat
+  bytes_read += fread(buf, 1, 2, s->fid);
+  if ( buf[0] != 1 || buf[1] != 0) {
+    AUBIO_ERR("source_wavread: AudioFormat should be PCM, in %s\n", s->path);
+    goto beach;
+  }
+
+  // NumChannels
+  bytes_read += fread(buf, 1, 2, s->fid);
+  channels = read_little_endian(buf, 2);
+
+  // SampleRate
+  bytes_read += fread(buf, 1, 4, s->fid);
+  sr = read_little_endian(buf, 4);
+
+  // ByteRate
+  bytes_read += fread(buf, 1, 4, s->fid);
+  byterate = read_little_endian(buf, 4);
+
+  // BlockAlign
+  bytes_read += fread(buf, 1, 2, s->fid);
+  blockalign = read_little_endian(buf, 2);
+
+  // BitsPerSample
+  bytes_read += fread(buf, 1, 2, s->fid);
+  bitspersample = read_little_endian(buf, 2);
+
+  if ( channels == 0 ) {
+    AUBIO_ERR("source_wavread: Can not read 0 channels in %s\n", s->path);
+    goto beach;
+  }
+
+  // the decoder consumes whole bytes and assembles each sample in a 32-bit
+  // integer, so other depths would read past the frame or overflow
+  if ( bitspersample == 0 || bitspersample > 32 || bitspersample % 8 != 0 ) {
+    AUBIO_ERR("source_wavread: can not process %dbit file %s\n",
+        bitspersample, s->path);
+    goto beach;
+  }
+
+  if ( byterate * 8 != sr * channels * bitspersample ) {
+    AUBIO_ERR("source_wavread: wrong byterate in %s\n", s->path);
+    goto beach;
+  }
+
+  // with channels >= 1 and bitspersample >= 8, passing this check also
+  // guarantees blockalign != 0, which the division further down relies on
+  if ( blockalign * 8 != channels * bitspersample ) {
+    AUBIO_ERR("source_wavread: wrong blockalign in %s\n", s->path);
+    goto beach;
+  }
+
+  s->input_samplerate = sr;
+  s->input_channels = channels;
+
+#if 0
+  AUBIO_DBG("channels %d\n", channels);
+  AUBIO_DBG("sr %d\n", sr);
+  AUBIO_DBG("byterate %d\n", byterate);
+  AUBIO_DBG("blockalign %d\n", blockalign);
+  AUBIO_DBG("bitspersample %d\n", bitspersample);
+
+  AUBIO_DBG("found %d channels in %s\n", s->input_channels, s->path);
+  AUBIO_DBG("found %d samplerate in %s\n", s->input_samplerate, s->path);
+#endif
+
+  if (samplerate == 0) {
+    s->samplerate = s->input_samplerate;
+  } else if (samplerate != s->input_samplerate) {
+    AUBIO_ERR("source_wavread: can not resample %s from %d to %dHz\n",
+        s->path, s->input_samplerate, samplerate);
+    goto beach;
+  }
+
+  // Subchunk2ID
+  bytes_read += fread(buf, 1, 4, s->fid);
+  buf[4] = '\0';
+  if ( strcmp((const char *)buf, "data") != 0 ) {
+    AUBIO_ERR("source_wavread: data RIFF header not found in %s\n", s->path);
+    goto beach;
+  }
+
+  // Subchunk2Size: byte size of the audio data, converted to frames
+  bytes_read += fread(buf, 1, 4, s->fid);
+  duration = read_little_endian(buf, 4) / blockalign;
+
+  // check the total number of bytes read is correct
+  if ( bytes_read != bytes_expected ) {
+#ifndef HAVE_WIN_HACKS
+    AUBIO_ERR("source_wavread: short read (%zd instead of %zd) in %s\n",
+        bytes_read, bytes_expected, s->path);
+#else // mingw does not know about %zd...
+    AUBIO_ERR("source_wavread: short read (%d instead of %d) in %s\n",
+        (int)bytes_read, (int)bytes_expected, s->path);
+#endif
+    goto beach;
+  }
+  // audio frames start right after the header; remembered for seeking
+  s->seek_start = bytes_read;
+
+  s->blockalign = blockalign;
+  s->bitspersample = bitspersample;
+  s->duration = duration;
+
+  // one buffer for the raw bytes, one for the decoded samples
+  s->output = new_fmat(s->input_channels, AUBIO_WAVREAD_BUFSIZE);
+  s->short_output = (unsigned char *)calloc(s->blockalign, AUBIO_WAVREAD_BUFSIZE);
+  if (s->output == NULL || s->short_output == NULL) {
+    AUBIO_ERR("source_wavread: could not allocate buffers to read %s\n", s->path);
+    goto beach;
+  }
+  s->read_index = 0;
+  s->read_samples = 0;
+  s->eof = 0;
+
+  return s;
+
+beach:
+  // closes the file if it was opened and releases whatever was allocated
+  del_aubio_source_wavread(s);
+  return NULL;
+}
+
+/* Refill the internal buffers with the next frames of the file.
+ *
+ * Reads up to AUBIO_WAVREAD_BUFSIZE frames of s->blockalign bytes into
+ * s->short_output, then decodes every little-endian sample into s->output
+ * (one row per channel), scaled by 1 / 2^(bitspersample - 1).
+ *
+ * s: reader to refill
+ * wavread_read: receives the number of complete frames obtained
+ *
+ * s->eof is set to 1 when no frame could be read.
+ */
+void aubio_source_wavread_readframe(aubio_source_wavread_t *s, uint_t *wavread_read);
+
+void aubio_source_wavread_readframe(aubio_source_wavread_t *s, uint_t *wavread_read) {
+  unsigned char *short_ptr = s->short_output;
+  size_t read = 0;
+  uint_t i, j, b, bitspersample = s->bitspersample;
+  uint_t bytespersample = (bitspersample + 7) / 8;
+  uint_t wrap_at, wrap_with;
+  smpl_t scaler;
+  int signed_val = 0;
+  unsigned int unsigned_val = 0;
+
+  // refuse layouts the loop below can not walk safely: shifts by 32 bits or
+  // more are undefined, and frames narrower than channels * bytes per sample
+  // would be read past the end of the raw buffer
+  if (bitspersample == 0 || bitspersample > 32
+      || bytespersample * s->input_channels > s->blockalign) {
+    *wavread_read = 0;
+    s->eof = 1;
+    return;
+  }
+
+  read = fread(short_ptr, s->blockalign, AUBIO_WAVREAD_BUFSIZE, s->fid);
+
+  // all shifts are done on unsigned operands; 2^32 does not fit in 32 bits,
+  // but unsigned subtraction is modular, so 0 stands in for it
+  wrap_at = 1u << (bitspersample - 1);
+  wrap_with = (bitspersample < 32) ? (1u << bitspersample) : 0;
+  scaler = 1. / wrap_at;
+
+  for (j = 0; j < read; j++) {
+    for (i = 0; i < s->input_channels; i++) {
+      // assemble the sample, least significant byte first
+      unsigned_val = 0;
+      for (b = 0; b < bitspersample; b += 8) {
+        unsigned_val += (unsigned int)(*short_ptr) << b;
+        short_ptr++;
+      }
+      if (bitspersample == 8) {
+        // 8-bit WAV samples are unsigned with the midpoint at 128, so
+        // [0;255] maps to [-128;127]
+        signed_val = (int)unsigned_val - (int)wrap_at;
+      } else if (unsigned_val >= wrap_at) {
+        // wider samples are two's complement: values with the top bit set
+        // are negative, with magnitude 2^bits - value
+        unsigned int magnitude = wrap_with - unsigned_val;
+        signed_val = -(int)(magnitude - 1) - 1;
+      } else {
+        signed_val = (int)unsigned_val;
+      }
+      s->output->data[i][j] = signed_val * scaler;
+    }
+  }
+
+  *wavread_read = read;
+
+  if (read == 0) s->eof = 1;
+}
+
+/* Read the next s->hop_size frames, mixed down to a single channel.
+ *
+ * Every output sample is the mean of all input channels for that frame.
+ * Frames are taken from the decoded buffer, which is refilled from the file
+ * whenever it runs out.
+ *
+ * s: reader
+ * read_data: output vector; must hold at least s->hop_size samples
+ * read: receives the number of frames actually read, which is smaller than
+ *   s->hop_size once the end of the file has been reached
+ *
+ * The part of the first s->hop_size samples that could not be read is set to
+ * zero.
+ */
+void aubio_source_wavread_do(aubio_source_wavread_t * s, fvec_t * read_data, uint_t * read){
+  uint_t i, j;
+  uint_t end = 0;
+  uint_t total_wrote = 0;
+  while (total_wrote < s->hop_size) {
+    // take what is left in the buffer, but no more than still needed
+    end = MIN(s->read_samples - s->read_index, s->hop_size - total_wrote);
+    for (i = 0; i < end; i++) {
+      smpl_t sum = 0;
+      for (j = 0; j < s->input_channels; j++ ) {
+        sum += s->output->data[j][i + s->read_index];
+      }
+      read_data->data[i + total_wrote] = sum / (smpl_t)(s->input_channels);
+    }
+    total_wrote += end;
+    if (total_wrote < s->hop_size) {
+      // buffer exhausted: fetch the next chunk and restart at its beginning
+      uint_t wavread_read = 0;
+      aubio_source_wavread_readframe(s, &wavread_read);
+      s->read_samples = wavread_read;
+      s->read_index = 0;
+      if (s->eof) {
+        break;
+      }
+    } else {
+      s->read_index += end;
+    }
+  }
+  // pad starting at the first sample that was not written; `end` only holds
+  // the size of the last copy and would clobber or skip valid samples
+  for (i = total_wrote; i < s->hop_size; i++) {
+    read_data->data[i] = 0.;
+  }
+  *read = total_wrote;
+}
+
+/* Read the next s->hop_size frames, keeping the channels separate.
+ *
+ * Row j of read_data receives channel j of the file. Frames are taken from
+ * the decoded buffer, which is refilled from the file whenever it runs out.
+ *
+ * s: reader
+ * read_data: output matrix; each row must hold at least s->hop_size samples
+ * read: receives the number of frames actually read, which is smaller than
+ *   s->hop_size once the end of the file has been reached
+ *
+ * Frames that could not be read are set to zero, and so are rows beyond the
+ * number of channels available in the file.
+ */
+void aubio_source_wavread_do_multi(aubio_source_wavread_t * s, fmat_t * read_data, uint_t * read){
+  uint_t i,j;
+  uint_t end = 0;
+  uint_t total_wrote = 0;
+  // s->output only has s->input_channels rows: never index past them
+  uint_t channels = MIN(read_data->height, s->input_channels);
+  while (total_wrote < s->hop_size) {
+    // take what is left in the buffer, but no more than still needed
+    end = MIN(s->read_samples - s->read_index, s->hop_size - total_wrote);
+    for (j = 0; j < channels; j++) {
+      for (i = 0; i < end; i++) {
+        // offset by read_index, otherwise each call would hand out the
+        // beginning of the buffer again
+        read_data->data[j][i + total_wrote] = s->output->data[j][i + s->read_index];
+      }
+    }
+    total_wrote += end;
+    if (total_wrote < s->hop_size) {
+      // buffer exhausted: fetch the next chunk and restart at its beginning
+      uint_t wavread_read = 0;
+      aubio_source_wavread_readframe(s, &wavread_read);
+      s->read_samples = wavread_read;
+      s->read_index = 0;
+      if (s->eof) {
+        break;
+      }
+    } else {
+      s->read_index += end;
+    }
+  }
+  // pad starting at the first frame that was not written (`end` only holds
+  // the size of the last copy); rows without a source channel are cleared
+  // from their first sample
+  for (j = 0; j < read_data->height; j++) {
+    i = (j < channels) ? total_wrote : 0;
+    for (; i < s->hop_size; i++) {
+      read_data->data[j][i] = 0.;
+    }
+  }
+  *read = total_wrote;
+}
+
+/* Samplerate, in Hz, stored in the reader when it was created. */
+uint_t aubio_source_wavread_get_samplerate(aubio_source_wavread_t * s) {
+  const uint_t rate = s->samplerate;
+  return rate;
+}
+
+/* Number of channels announced by the header of the opened file. */
+uint_t aubio_source_wavread_get_channels(aubio_source_wavread_t * s) {
+  const uint_t file_channels = s->input_channels;
+  return file_channels;
+}
+
+/* Move the reading position to frame `pos`, counted from the first frame of
+ * audio data.
+ *
+ * s: reader
+ * pos: frame index to seek to
+ *
+ * Returns AUBIO_OK on success. Returns AUBIO_FAIL when pos is negative once
+ * seen as a signed value, when the file has been closed, or when fseek fails.
+ */
+uint_t aubio_source_wavread_seek (aubio_source_wavread_t * s, uint_t pos) {
+  int ret = 0;
+  if ((sint_t)pos < 0) {
+    return AUBIO_FAIL;
+  }
+  if (s->fid == NULL) {
+    AUBIO_ERR("source_wavread: could not seek %s (file not opened?)\n", s->path);
+    return AUBIO_FAIL;
+  }
+  // widen before multiplying so that large positions do not wrap in 32 bits
+  ret = fseek(s->fid, (long)(s->seek_start + (size_t)pos * s->blockalign), SEEK_SET);
+  if (ret != 0) {
+    AUBIO_ERR("source_wavread: could not seek %s at %d (%s)\n", s->path, pos, strerror(errno));
+    return AUBIO_FAIL;
+  }
+  // reset some values; the decoded buffer still holds frames from the old
+  // position, so mark it empty to force a refill on the next read
+  s->eof = 0;
+  s->read_index = 0;
+  s->read_samples = 0;
+  return AUBIO_OK;
+}
+
+/* Frame count computed from the data chunk size when the file was opened;
+ * 0 when s is NULL. */
+uint_t aubio_source_wavread_get_duration (const aubio_source_wavread_t * s) {
+  return (s != NULL) ? s->duration : 0;
+}
+
+/* Close the underlying file.
+ *
+ * s: reader
+ *
+ * Returns AUBIO_OK when the file was closed. Returns AUBIO_FAIL when s is
+ * NULL, when no file is open (for instance after a previous close), or when
+ * fclose reports an error.
+ */
+uint_t aubio_source_wavread_close (aubio_source_wavread_t * s) {
+  FILE *fid;
+  if (s == NULL || s->fid == NULL) {
+    return AUBIO_FAIL;
+  }
+  // forget the stream before closing it: it must not be used again even if
+  // fclose fails, and a later close or del_ would otherwise close it twice
+  fid = s->fid;
+  s->fid = NULL;
+  if (fclose(fid)) {
+    AUBIO_ERR("source_wavread: could not close %s (%s)\n", s->path, strerror(errno));
+    return AUBIO_FAIL;
+  }
+  return AUBIO_OK;
+}
+
+/* Destroy a reader: close its file, then release both buffers, the stored
+ * path and the object itself. Does nothing when s is NULL. */
+void del_aubio_source_wavread(aubio_source_wavread_t * s) {
+  if (s == NULL) {
+    return;
+  }
+  // the result is ignored: closing fails harmlessly when no file is open
+  aubio_source_wavread_close(s);
+  if (s->short_output != NULL) {
+    AUBIO_FREE(s->short_output);
+  }
+  if (s->output != NULL) {
+    del_fmat(s->output);
+  }
+  if (s->path != NULL) {
+    AUBIO_FREE(s->path);
+  }
+  AUBIO_FREE(s);
+}
+
+#endif /* HAVE_WAVREAD */