octave-nkf: libinterp/dldfcn/audiodevinfo.cc comparison

comparison libinterp/dldfcn/audiodevinfo.cc @ 19589:9bd2f0a07c95

improve performance of audio callback functions

* audiodevinfo.cc (octave_play_callback, portaudio_play_callback): Avoid unnecessary copying of data.

author	John W. Eaton <jwe@octave.org>
date	Fri, 09 Jan 2015 13:19:50 -0500
parents	8dce81f7448d
children	d7057df2968e

comparison

equal deleted inserted replaced

-:398e42431dcc
+:9bd2f0a07c95
 {
 error ("audio player callback function failed");
 return paAbort;
 }
-Matrix sound = retval(0).matrix_value ();
+const Matrix sound = retval(0).matrix_value ();
 int return_status = retval(1).int_value ();
 if (error_state || frames != sound.rows ()
 || sound.columns () < 1 || sound.columns () > 2)
 {
 error ("audio player callback function failed");
 return paAbort;
 }
-double scale_factor = 1.0;
+// Don't multiply the audio data by scale_factor here.  Although it
+// would move the operation outside of the loops below, it also causes
-switch (player->get_nbits ())
+// a second copy of the data array to be made.
-{
-case 8:
+const ColumnVector sound_l = sound.column (0);
-scale_factor = pow (2.0, 7) - 1.0;
+const ColumnVector sound_r = (sound.columns () == 1)
-break;
+? sound_l : sound.column (1);
-case 16:
-scale_factor = pow (2.0, 15) - 1.0;
-break;
-case 24:
-scale_factor = pow (2.0, 23) - 1.0;
-break;
-default:
-error ("invalid player bit depth in callback function");
-break;
-}
-sound = sound * scale_factor;
-const RowVector sound_l = (sound.column (0)).transpose ();
-const RowVector sound_r = (sound.columns () == 1)
-? sound_l : (sound.column (1)).transpose ();
 const double *p_l = sound_l.data ();
 const double *p_r = sound_r.data ();
 switch (player->get_nbits ())
 {
 case 8:
 {
+static double scale_factor = pow (2.0, 7) - 1.0;
 int8_t *buffer = static_cast<int8_t *> (output);
 for (unsigned long i = 0; i < frames; i++)
 {
-buffer[2*i] = p_l[i];
+buffer[2*i] = p_l[i] * scale_factor;
-buffer[2*i+1] = p_r[i];
+buffer[2*i+1] = p_r[i] * scale_factor;
 }
 }
 break;
 case 16:
 {
+static double scale_factor = pow (2.0, 15) - 1.0;
 int16_t *buffer = static_cast<int16_t *> (output);
 for (unsigned long i = 0; i < frames; i++)
 {
-buffer[2*i] = p_l[i];
+buffer[2*i] = p_l[i] * scale_factor;
-buffer[2*i+1] = p_r[i];
+buffer[2*i+1] = p_r[i] * scale_factor;
 }
 }
 break;
 case 24:
 {
-int big_endian = is_big_endian ();
+static double scale_factor = pow (2.0, 23) - 1.0;
+static int big_endian = is_big_endian ();
 uint8_t *buffer = static_cast<uint8_t *> (output);
 for (unsigned long i = 0; i < frames; i++)
 {
 uint8_t *_sample_l = reinterpret_cast<uint8_t *> (&sample_l);
 uint8_t *_sample_r = reinterpret_cast<uint8_t *> (&sample_r);
 unsigned long offset = i * 6;
-buffer[offset+0] = _sample_l[0+big_endian];
+buffer[offset+0] = _sample_l[0+big_endian] * scale_factor;
-buffer[offset+1] = _sample_l[1+big_endian];
+buffer[offset+1] = _sample_l[1+big_endian] * scale_factor;
-buffer[offset+2] = _sample_l[2+big_endian];
+buffer[offset+2] = _sample_l[2+big_endian] * scale_factor;
-buffer[offset+3] = _sample_r[0+big_endian];
+buffer[offset+3] = _sample_r[0+big_endian] * scale_factor;
-buffer[offset+4] = _sample_r[1+big_endian];
+buffer[offset+4] = _sample_r[1+big_endian] * scale_factor;
-buffer[offset+5] = _sample_r[2+big_endian];
+buffer[offset+5] = _sample_r[2+big_endian] * scale_factor;
 }
 }
 break;
 default:
 {
 error ("audio player callback function called without player");
 return paAbort;
 }
-double scale_factor = 1.0;
+// Don't multiply the audio data by scale_factor here.  Although it
+// would move the operation outside of the loops below, it also causes
-switch (player->get_nbits ())
+// a second copy of the *entire* data array to be made when only a
-{
+// small portion (BUFFER_SIZE elements) is usually needed for this
-case 8:
+// callback.
-scale_factor = pow (2.0, 7) - 1.0;
-break;
+const RowVector sound_l = player->get_left ();
+const RowVector sound_r = player->get_right ();
-case 16:
-scale_factor = pow (2.0, 15) - 1.0;
-break;
-case 24:
-scale_factor = pow (2.0, 23) - 1.0;
-break;
-default:
-error ("invalid player bit depth in callback function");
-break;
-}
-const RowVector sound_l = player->get_left () * scale_factor;
-const RowVector sound_r = player->get_right () * scale_factor;
 const double *pl = sound_l.data ();
 const double *pr = sound_l.data ();
 if (player->get_type () == DOUBLE)
 {
 switch (player->get_nbits ())
 {
 case 8:
 {
+static double scale_factor = pow (2.0, 7) - 1.0;
 int8_t *buffer = static_cast<int8_t *> (output);
 for (unsigned long j = 0; j < frames; j++)
 {
 unsigned int sample_number = player->get_sample_number ();
 if (sample_number >= player->get_end_sample ())
 return paComplete;
 unsigned long offset = j * 2;
-buffer[offset+0] = pl[sample_number];
+buffer[offset+0] = pl[sample_number] * scale_factor;
-buffer[offset+1] = pr[sample_number];
+buffer[offset+1] = pr[sample_number] * scale_factor;
 player->set_sample_number (sample_number + 1);
 }
 }
 break;
 case 16:
 {
+static double scale_factor = pow (2.0, 15) - 1.0;
 int16_t *buffer = static_cast<int16_t *> (output);
 for (unsigned long j = 0; j < frames; j++)
 {
 unsigned int sample_number = player->get_sample_number ();
 if (sample_number >= player->get_end_sample ())
 return paComplete;
 unsigned long offset = j * 2;
-buffer[offset+0] = pl[sample_number];
+buffer[offset+0] = pl[sample_number] * scale_factor;
-buffer[offset+1] = pr[sample_number];
+buffer[offset+1] = pr[sample_number] * scale_factor;
 player->set_sample_number (sample_number + 1);
 }
 }
 break;
 case 24:
 {
+static double scale_factor = pow (2.0, 23) - 1.0;
+static int big_endian = is_big_endian ();
 uint8_t *buffer = static_cast<uint8_t *> (output);
 for (unsigned long j = 0; j < frames; j++)
 {
 unsigned int sample_number = player->get_sample_number ();
 if (sample_number >= player->get_end_sample ())
 return paComplete;
-int32_t sample_l = pl[sample_number];
+int32_t sample_l = pl[sample_number] * scale_factor;
-int32_t sample_r = pr[sample_number];
+int32_t sample_r = pr[sample_number] * scale_factor;
 sample_l &= 0x00ffffff;
 sample_r &= 0x00ffffff;
-int big_endian = is_big_endian ();
 // FIXME: Would a mask work better?
 uint8_t *_sample_l = reinterpret_cast<uint8_t *> (&sample_l);
 uint8_t *_sample_r = reinterpret_cast<uint8_t *> (&sample_r);

Mercurial > octave-nkf

comparison libinterp/dldfcn/audiodevinfo.cc @ 19589:9bd2f0a07c95