Ejemplo n.º 1
0
/*
 * Read an audio file through libSoX and return its samples as a new 2-D
 * tensor laid out as (channels, samples per channel).
 *
 * file_name: path passed to sox_open_read() with default format parameters.
 *
 * Returns the tensor produced by THTensor_(newContiguous); the caller owns
 * that reference.
 *
 * Every failure is reported through abort_().  The SoX handle and the sample
 * buffer are released before each abort_() call because abort_() is defined
 * elsewhere and may not return here -- NOTE(review): confirm.
 */
static THTensor * libsox_(read_audio_file)(const char *file_name)
{
  // Open the file; the handle carries the signal description
  sox_format_t *fd = sox_open_read(file_name, NULL, NULL, NULL);
  if (fd == NULL)
    abort_("[read_audio_file] Failure to read file");

  size_t nchannels = fd->signal.channels;
  size_t buffer_size = fd->signal.length;

  // The channel count is used as a divisor below
  if (nchannels == 0) {
    sox_close(fd);
    abort_("[read_audio_file] Invalid channel count");
  }

  // Read every interleaved sample into an int32_t buffer
  int32_t *buffer = NULL;
  size_t samples_read = 0;
  if (buffer_size > 0) {
    if (buffer_size <= SIZE_MAX / sizeof *buffer)
      buffer = malloc(sizeof *buffer * buffer_size);
    if (buffer == NULL) {
      sox_close(fd);
      abort_("[read_audio_file] Out of memory");
    }
    samples_read = sox_read(fd, buffer, buffer_size);
  }
  if (samples_read == 0) {
    free(buffer);
    sox_close(fd);
    abort_("[read_audio_file] Empty file or read failed in sox_read");
  }

  // A trailing partial frame, if any, is dropped by the integer division
  size_t frames = samples_read / nchannels;

  // alloc tensor
  // The reference from newWithSize2d is dropped through its own pointer, so
  // the result stays valid whether newContiguous returns the same object with
  // an extra reference or a fresh copy (presumably the former for a freshly
  // sized tensor -- confirm against the TH API).
  THTensor *sized = THTensor_(newWithSize2d)((long)nchannels, (long)frames);
  THTensor *tensor = THTensor_(newContiguous)(sized);
  THTensor_(free)(sized);
  real *tensor_data = THTensor_(data)(tensor);

  // De-interleave: the buffer is frame-major, the tensor is channel-major
  for (size_t ch = 0; ch < nchannels; ch++) {
    for (size_t frame = 0; frame < frames; frame++) {
      *tensor_data++ = (real)buffer[frame * nchannels + ch];
    }
  }

  // free buffer and sox structures
  sox_close(fd);
  free(buffer);

  // return tensor
  return tensor;
}
Ejemplo n.º 2
0
/*
 * On an alsa capable system, plays an audio file starting 10 seconds in.
 * Copes with sample-rate and channel change if necessary since it's
 * common for audio drivers to support a subset of rates and channel
 * counts.
 * E.g. example3 song2.ogg
 *
 * Can easily be changed to work with other audio device drivers supported
 * by libSoX; e.g. "oss", "ao", "coreaudio", etc.
 * See the soxformat(7) manual page.
 *
 * Every libSoX call is made as a plain statement and only its result is
 * asserted, so the calls still run when assert() is compiled out with
 * NDEBUG.  Failures are still only detected in builds that keep assertions
 * enabled.
 */
int main(int argc, char * argv[])
{
  static sox_format_t * in, * out; /* input and output files */
  sox_effects_chain_t * chain;
  sox_effect_t * e;
  sox_signalinfo_t interm_signal;
  char * args[10];
  int rc; /* result of the most recent libSoX call */

  assert(argc == 2);
  sox_globals.output_message_handler = output_message;
  sox_globals.verbosity = 1;

  rc = sox_init();
  assert(rc == SOX_SUCCESS);

  in = sox_open_read(argv[1], NULL, NULL, NULL);
  assert(in != NULL);

  /* Change "alsa" in this line to use an alternative audio device driver: */
  out = sox_open_write("default", &in->signal, NULL, "alsa", NULL, NULL);
  assert(out != NULL);

  chain = sox_create_effects_chain(&in->encoding, &out->encoding);

  /* Scratch copy handed to sox_add_effect as the mutable input description,
   * so that in->signal itself is left alone: */
  interm_signal = in->signal; /* NB: deep copy */

  /* Source of samples: the input file */
  e = sox_create_effect(sox_find_effect("input"));
  args[0] = (char *)in;
  rc = sox_effect_options(e, 1, args);
  assert(rc == SOX_SUCCESS);
  rc = sox_add_effect(chain, e, &interm_signal, &in->signal);
  assert(rc == SOX_SUCCESS);
  free(e);

  /* Skip the first 10 seconds */
  e = sox_create_effect(sox_find_effect("trim"));
  args[0] = "10";
  rc = sox_effect_options(e, 1, args);
  assert(rc == SOX_SUCCESS);
  rc = sox_add_effect(chain, e, &interm_signal, &in->signal);
  assert(rc == SOX_SUCCESS);
  free(e);

  /* Resample only if the output was opened with a different rate */
  if (in->signal.rate != out->signal.rate) {
    e = sox_create_effect(sox_find_effect("rate"));
    rc = sox_effect_options(e, 0, NULL);
    assert(rc == SOX_SUCCESS);
    rc = sox_add_effect(chain, e, &interm_signal, &out->signal);
    assert(rc == SOX_SUCCESS);
    free(e);
  }

  /* Remix only if the output was opened with a different channel count */
  if (in->signal.channels != out->signal.channels) {
    e = sox_create_effect(sox_find_effect("channels"));
    rc = sox_effect_options(e, 0, NULL);
    assert(rc == SOX_SUCCESS);
    rc = sox_add_effect(chain, e, &interm_signal, &out->signal);
    assert(rc == SOX_SUCCESS);
    free(e);
  }

  /* Sink for samples: the output device */
  e = sox_create_effect(sox_find_effect("output"));
  args[0] = (char *)out;
  rc = sox_effect_options(e, 1, args);
  assert(rc == SOX_SUCCESS);
  rc = sox_add_effect(chain, e, &interm_signal, &out->signal);
  assert(rc == SOX_SUCCESS);
  free(e);

  (void)rc; /* only read by assert(); keeps NDEBUG builds warning-free */

  sox_flow_effects(chain, NULL, NULL);

  sox_delete_effects_chain(chain);
  sox_close(out);
  sox_close(in);
  sox_quit();

  return 0;
}
Ejemplo n.º 3
0
/*
 * Reads input file and displays a few seconds of wave-form, starting from
 * a given time through the audio.   E.g. example2 song2.au 30.75 1
 *
 * Arguments: input file, optional start time in seconds (default 0),
 * optional display period in seconds (default 2).
 *
 * Every call with a side effect is made as a plain statement and only its
 * result is asserted, so the program still does its work when assert() is
 * compiled out with NDEBUG.  Failures are still only detected in builds that
 * keep assertions enabled.
 */
int main(int argc, char * argv[])
{
  sox_format_t * in;
  sox_sample_t * buf;
  size_t blocks, block_size;
  /* Period of audio over which we will measure its volume in order to
   * display the wave-form: */
  static const double block_period = 0.025; /* seconds */
  double start_secs = 0, period = 2;
  char dummy;
  uint64_t seek;
  int rc; /* result of the most recent checked call */

  /* All libSoX applications must start by initialising the SoX library */
  rc = sox_init();
  assert(rc == SOX_SUCCESS);

  assert(argc > 1);
  ++argv, --argc; /* Move to 1st parameter */

  /* Open the input file (with default parameters) */
  in = sox_open_read(*argv, NULL, NULL, NULL);
  assert(in != NULL);
  ++argv, --argc; /* Move past this parameter */

  if (argc) { /* If given, read the start time: */
    /* The trailing %c must not match: exactly one conversion means the
     * argument was a number with nothing after it */
    rc = sscanf(*argv, "%lf%c", &start_secs, &dummy);
    assert(rc == 1);
    ++argv, --argc; /* Move past this parameter */
  }

  if (argc) { /* If given, read the period of time to display: */
    rc = sscanf(*argv, "%lf%c", &period, &dummy);
    assert(rc == 1);
    ++argv, --argc; /* Move past this parameter */
  }

  /* This example program requires that the audio has precisely 2 channels.
   * Checked before the channel count is used as a modulus below: */
  assert(in->signal.channels == 2);

  /* Calculate the start position in number of samples: */
  seek = start_secs * in->signal.rate * in->signal.channels + .5;
  /* Make sure that this is at a `wide sample' boundary: */
  seek -= seek % in->signal.channels;
  /* Move the file pointer to the desired starting position */
  rc = sox_seek(in, seek, SOX_SEEK_SET);
  assert(rc == SOX_SUCCESS);

  /* Convert block size (in seconds) to a number of samples: */
  block_size = block_period * in->signal.rate * in->signal.channels + .5;
  /* Make sure that this is at a `wide sample' boundary: */
  block_size -= block_size % in->signal.channels;
  /* Allocate a block of memory to store the block of audio samples: */
  buf = malloc(sizeof(sox_sample_t) * block_size);
  assert(buf != NULL);

  (void)rc; /* only read by assert(); keeps NDEBUG builds warning-free */

  /* Read and process blocks of audio for the selected period or until EOF: */
  for (blocks = 0; sox_read(in, buf, block_size) == block_size && blocks * block_period < period; ++blocks) {
    double left = 0, right = 0;
    size_t i;
    static const char line[] = "===================================";
    int l, r;

    for (i = 0; i < block_size; ++i) {
      SOX_SAMPLE_LOCALS;
      /* convert the sample from SoX's internal format to a `double' for
       * processing in this application: */
      double sample = SOX_SAMPLE_TO_FLOAT_64BIT(buf[i],);

      /* The samples for each channel are interleaved; in this example
       * we allow only stereo audio, so the left channel audio can be found in
       * even-numbered samples, and the right channel audio in odd-numbered
       * samples: */
      if (i & 1)
        right = max(right, fabs(sample)); /* Find the peak volume in the block */
      else
        left = max(left, fabs(sample)); /* Find the peak volume in the block */
    }

    /* Build up the wave form by displaying the left & right channel
     * volume as a line length: the offset into `line' skips more of the
     * 35 '=' characters the quieter the channel is */
    l = (1 - left) * 35 + .5;
    r = (1 - right) * 35 + .5;
    printf("%8.3f%36s|%s\n", start_secs + blocks * block_period, line + l, line + r);
  }

  /* All done; tidy up: */
  free(buf);
  sox_close(in);
  sox_quit();
  return 0;
}
Ejemplo n.º 4
0
/*
 * Decode the audio file named by argv[1], convert it to 2 channels at
 * 44100 Hz where the input differs, and hand the samples to the
 * `stdout_writer` callback (defined elsewhere in this file) as the last
 * stage of the effects chain.
 *
 * Any libSoX failure is reported through oops(); a wrong argument count
 * prints a usage line and exits with status 1.
 */
int main(int argc, char** argv) {
    if (argc != 2) {
        fprintf(stderr, "usage: %s input_file > output_file\n", argv[0]);
        exit(1);
    }

    const int out_channels = 2, sample_rate = 44100;

    if (sox_init() != SOX_SUCCESS) {
        oops("sox_init()");
    }

    sox_format_t* input = sox_open_read(argv[1], NULL, NULL, NULL);
    if (!input) {
        oops("sox_open_read()");
    }

    /* Target signal description; `{0}` rather than the empty initializer,
     * which is not valid before C23. */
    sox_signalinfo_t out_si = {0};
    out_si.rate = sample_rate;
    out_si.channels = out_channels;
    out_si.precision = SOX_SAMPLE_PRECISION;

    /* Scratch copy of the input description.  sox_add_effect takes its
     * input signal through a non-const pointer, so the copy is threaded
     * through the chain instead of &input->signal, leaving the open file's
     * own description untouched. */
    sox_signalinfo_t interm_si = input->signal;

    /* Custom terminal effect.  Fields are positional; stdout_writer occupies
     * the sixth slot -- presumably the flow callback, confirm against the
     * sox_effect_handler_t declaration. */
    sox_effect_handler_t out_handler = {
        "stdout", NULL, SOX_EFF_MCHAN, NULL, NULL, stdout_writer, NULL, NULL, NULL, 0
    };

    sox_effects_chain_t* chain
        = sox_create_effects_chain(&input->encoding, NULL);
    if (!chain) {
        oops("sox_create_effects_chain()");
    }

    /* Source of samples: the input file. */
    {
        sox_effect_t* effect = sox_create_effect(sox_find_effect("input"));
        if (!effect) {
            oops("sox_create_effect(input)");
        }

        char* args[1] = { (char*)input };
        if (sox_effect_options(effect, 1, args) != SOX_SUCCESS) {
            oops("sox_effect_options(input)");
        }

        if (sox_add_effect(
                chain, effect, &interm_si, &out_si) != SOX_SUCCESS) {
            oops("sox_add_effect(input)");
        }

        free(effect);
    }

    /* Resampling stage, only when the input rate differs from the target. */
    if (input->signal.rate != out_si.rate) {
        /* `gain -h` is added ahead of `rate`; see the SoX manual for the
         * meaning of -h. */
        {
            sox_effect_t* effect = sox_create_effect(sox_find_effect("gain"));
            if (!effect) {
                oops("sox_create_effect(gain)");
            }

            const char* args[] = { "-h" };

            if (sox_effect_options(effect, 1, (char**)args) != SOX_SUCCESS) {
                oops("sox_effect_options(gain)");
            }

            if (sox_add_effect(
                    chain, effect, &interm_si, &out_si) != SOX_SUCCESS) {
                oops("sox_add_effect(gain)");
            }

            free(effect);
        }

        {
            sox_effect_t* effect = sox_create_effect(sox_find_effect("rate"));
            if (!effect) {
                oops("sox_create_effect(rate)");
            }

            const char* args[] = { "-Q", "7", "-b", "99.7" };

            if (sox_effect_options(effect, 4, (char**)args) != SOX_SUCCESS) {
                oops("sox_effect_options(rate)");
            }

            if (sox_add_effect(
                    chain, effect, &interm_si, &out_si) != SOX_SUCCESS) {
                oops("sox_add_effect(rate)");
            }

            free(effect);
        }
    }

    /* Channel conversion, only when the input channel count differs. */
    if (input->signal.channels != out_si.channels) {
        sox_effect_t* effect = sox_create_effect(sox_find_effect("channels"));
        if (!effect) {
            oops("sox_create_effect(channels)");
        }

        if (sox_effect_options(effect, 0, NULL) != SOX_SUCCESS) {
            oops("sox_effect_options(channels)");
        }

        if (sox_add_effect(
                chain, effect, &interm_si, &out_si) != SOX_SUCCESS) {
            oops("sox_add_effect(channels)");
        }

        free(effect);
    }

    /* Sink for samples: the custom handler declared above. */
    {
        sox_effect_t* effect = sox_create_effect(&out_handler);
        if (!effect) {
            oops("sox_create_effect(output)");
        }

        if (sox_add_effect(
                chain, effect, &interm_si, &out_si) != SOX_SUCCESS) {
            oops("sox_add_effect(output)");
        }

        free(effect);
    }

    sox_flow_effects(chain, NULL, NULL);

    sox_delete_effects_chain(chain);

    if (sox_close(input) != SOX_SUCCESS) {
        oops("sox_close()");
    }

    if (sox_quit() != SOX_SUCCESS) {
        oops("sox_quit()");
    }

    return 0;
}
Ejemplo n.º 5
0
/*
 * Reads input file, applies vol & flanger effects, stores in output file.
 * E.g. example1 monkey.au monkey.aiff
 *
 * Every libSoX call is made as a plain statement and only its result is
 * asserted, so the calls still run when assert() is compiled out with
 * NDEBUG.  Failures are still only detected in builds that keep assertions
 * enabled.
 */
int main(int argc, char * argv[]){

  static sox_format_t * in, * out; /* input and output files */
  sox_effects_chain_t * chain;
  sox_effect_t * e;
  char * args[10];
  int rc; /* result of the most recent libSoX call */

  assert(argc == 3);

  /* All libSoX applications must start by initialising the SoX library */
  rc = sox_init();
  assert(rc == SOX_SUCCESS);

  /* Open the input file (with default parameters) */
  in = sox_open_read(argv[1], NULL, NULL, NULL);
  assert(in != NULL);

  /* Open the output file; we must specify the output signal characteristics.
   * Since we are using only simple effects, they are the same as the input
   * file characteristics */
  out = sox_open_write(argv[2], &in->signal, NULL, NULL, NULL, NULL);
  assert(out != NULL);

  /* Create an effects chain; some effects need to know about the input
   * or output file encoding so we provide that information here */
  chain = sox_create_effects_chain(&in->encoding, &out->encoding);

  /* The first effect in the effect chain must be something that can source
   * samples; in this case, we use the built-in handler that inputs
   * data from an audio file */
  e = sox_create_effect(sox_find_effect("input"));
  args[0] = (char *)in;
  rc = sox_effect_options(e, 1, args);
  assert(rc == SOX_SUCCESS);
  /* This becomes the first `effect' in the chain */
  rc = sox_add_effect(chain, e, &in->signal, &in->signal);
  assert(rc == SOX_SUCCESS);
  /* Release the effect object once it has been added, as the other
   * examples in this file do; without this each one is leaked */
  free(e);

  /* Create the `vol' effect, and initialise it with the desired parameters: */
  e = sox_create_effect(sox_find_effect("vol"));
  args[0] = "3dB";
  rc = sox_effect_options(e, 1, args);
  assert(rc == SOX_SUCCESS);
  /* Add the effect to the end of the effects processing chain: */
  rc = sox_add_effect(chain, e, &in->signal, &in->signal);
  assert(rc == SOX_SUCCESS);
  free(e);

  /* Create the `flanger' effect, and initialise it with default parameters: */
  e = sox_create_effect(sox_find_effect("flanger"));
  rc = sox_effect_options(e, 0, NULL);
  assert(rc == SOX_SUCCESS);
  /* Add the effect to the end of the effects processing chain: */
  rc = sox_add_effect(chain, e, &in->signal, &in->signal);
  assert(rc == SOX_SUCCESS);
  free(e);

  /* The last effect in the effect chain must be something that only consumes
   * samples; in this case, we use the built-in handler that outputs
   * data to an audio file */
  e = sox_create_effect(sox_find_effect("output"));
  args[0] = (char *)out;
  rc = sox_effect_options(e, 1, args);
  assert(rc == SOX_SUCCESS);
  rc = sox_add_effect(chain, e, &in->signal, &in->signal);
  assert(rc == SOX_SUCCESS);
  free(e);

  (void)rc; /* only read by assert(); keeps NDEBUG builds warning-free */

  /* Flow samples through the effects processing chain until EOF is reached */
  sox_flow_effects(chain, NULL, NULL);

  /* All done; tidy up: */
  sox_delete_effects_chain(chain);
  sox_close(out);
  sox_close(in);
  sox_quit();
  return 0;
}
Ejemplo n.º 6
0
/*
 * Read the first SONG_LENGTH_S seconds of the input file (argv[1]) and write
 * them to a "wav" output file (argv[2]) as one-second chunks, in the order
 * given by the array that randomize_byte_order() fills in.
 *
 * Returns 0 on success.  Exits or returns with EXIT_FAILURE when the
 * arguments are wrong, libSoX cannot be initialised, a file cannot be
 * opened, the buffer cannot be allocated, or a chunk cannot be written.  A
 * short read is reported but not fatal: the part of the buffer that was not
 * filled is zero, because the buffer comes from calloc().
 */
int main(int argc, char* argv[])
{
   static sox_format_t *in_file, *out_file;
   sox_sample_t *buffer;
   size_t samples_per_second;
   size_t sample_count;
   unsigned int sample_order[SONG_LENGTH_S];
   unsigned int i;
   int status = 0;

   if(argc != 3) {
      usage();
      exit(EXIT_FAILURE);
   }

   if (sox_init() != SOX_SUCCESS) {
      fprintf(stderr, "error: could not initialize Sox\n");
      exit(EXIT_FAILURE);
   }

   if((in_file = sox_open_read(argv[1], NULL, NULL, NULL)) == NULL) {
      fprintf(stderr, "error could not read input file\n");
      exit(EXIT_FAILURE);
   }

   if((out_file = sox_open_write(argv[2], &in_file->signal,
                     NULL, "wav", NULL, NULL)) == NULL) {
      fprintf(stderr, "error could not open output file\n");
      exit(EXIT_FAILURE);
   }

   /* Interleaved samples in one second of audio.  Computed once so that the
    * buffer size, the chunk offsets and the chunk length all agree. */
   samples_per_second = (size_t)in_file->signal.rate * in_file->signal.channels;
   sample_count = (size_t)SONG_LENGTH_S * samples_per_second;

   /* calloc: checks the size multiplication and zero-fills, so a short read
    * below leaves zeros rather than uninitialised memory in the tail */
   buffer = calloc(sample_count, sizeof *buffer);
   if (buffer == NULL) {
      fprintf(stderr, "error could not allocate sample buffer\n");
      sox_close(in_file);
      sox_close(out_file);
      sox_quit();
      exit(EXIT_FAILURE);
   }

   randomize_byte_order(sample_order);

   if (sox_read(in_file, buffer, sample_count) != sample_count) {
      fprintf(stderr, "Incorrect number of samples read");
   }

   /* Emit the one-second chunks in the order held in sample_order.
    * Assumes each entry is below SONG_LENGTH_S -- TODO confirm against
    * randomize_byte_order(). */
   for(i=0;i<SONG_LENGTH_S;i++) {
      const sox_sample_t *chunk = buffer + (size_t)sample_order[i] * samples_per_second;

      if (sox_write(out_file, chunk, samples_per_second) != samples_per_second) {
         fprintf(stderr, "error could not write output file\n");
         status = EXIT_FAILURE;
         break;
      }
   }

   free(buffer);

   sox_close(in_file);
   sox_close(out_file);

   sox_quit();

   return status;
}