summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--media/audio/audio_util.cc89
-rw-r--r--media/audio/audio_util.h24
-rw-r--r--media/audio/audio_util_unittest.cc71
-rw-r--r--media/audio/win/waveout_output_win.cc25
-rw-r--r--media/audio/win/waveout_output_win.h3
5 files changed, 207 insertions, 5 deletions
diff --git a/media/audio/audio_util.cc b/media/audio/audio_util.cc
index dabe448..c1c1bc8 100644
--- a/media/audio/audio_util.cc
+++ b/media/audio/audio_util.cc
@@ -59,4 +59,93 @@ bool AdjustVolume(void* buf,
return false;
}
+// Channel order for AAC
+// From http://www.hydrogenaudio.org/forums/lofiversion/index.php/t40046.html
+// And Quicktime Pro, Movie Inspector
+const int kChannel_C = 0;
+const int kChannel_L = 1;
+const int kChannel_R = 2;
+const int kChannel_SL = 3;
+const int kChannel_SR = 4;
+const int kChannel_LFE = 5;
+
+template<class Format>
+Format ChannelsClampInternal(float val,
+ const Format min_value,
+ const Format max_value) {
+ if (val > static_cast<float>(max_value)) {
+ return max_value;
+ }
+ if (val < static_cast<float>(min_value)) {
+ return min_value;
+ }
+ return static_cast<Format>(val);
+}
+
+template<class Format>
+void FoldChannelsInternal(Format* buf_out,
+ int sample_count,
+ float volume,
+ int channels,
+ const int min_value,
+ const int max_value) {
+ Format* buf_in = buf_out;
+ // mid_value is to adjust excess 128 notation in unsigned 8 bit samples
+ // to signed before adding channels.
+ const int mid_value = (max_value + min_value + 1) / 2;
+ const float kHalfPerceived = 0.707f; // 1/sqrt(2)
+ for (int i = 0; i < sample_count; ++i) {
+ float center_half = static_cast<float>(buf_in[kChannel_C] - mid_value) * kHalfPerceived;
+ float left = static_cast<float>(buf_in[kChannel_L] - mid_value);
+ float right = static_cast<float>(buf_in[kChannel_R] - mid_value);
+ float surround_left = static_cast<float>(buf_in[kChannel_SL] - mid_value);
+ float surround_right = static_cast<float>(buf_in[kChannel_SR] - mid_value);
+ buf_out[0] = ChannelsClampInternal(
+ (left + surround_left + center_half) * volume + mid_value,
+ static_cast<Format>(min_value), static_cast<Format>(max_value));
+ buf_out[1] = ChannelsClampInternal(
+ (right + surround_right + center_half) * volume + mid_value,
+ static_cast<Format>(min_value), static_cast<Format>(max_value));
+ buf_out += 2;
+ buf_in += channels;
+ }
+}
+
+bool FoldChannels(void* buf,
+ size_t buflen,
+ int channels,
+ int bytes_per_sample,
+ float volume) {
+ DCHECK(buf);
+ DCHECK(volume >= 0.0f && volume <= 1.0f);
+ if (channels >= 5 && channels <= 6 && bytes_per_sample > 0) {
+ int sample_count = buflen / (channels * bytes_per_sample);
+ if (bytes_per_sample == 1) {
+ FoldChannelsInternal(reinterpret_cast<uint8*>(buf),
+ sample_count,
+ volume,
+ channels,
+ 0, 255);
+ return true;
+ } else if (bytes_per_sample == 2) {
+ FoldChannelsInternal(reinterpret_cast<int16*>(buf),
+ sample_count,
+ volume,
+ channels,
+ -32768,
+ 32767);
+ return true;
+ } else if (bytes_per_sample == 4) {
+ FoldChannelsInternal(reinterpret_cast<int32*>(buf),
+ sample_count,
+ volume,
+ channels,
+ 0x80000000,
+ 0x7fffffff);
+ return true;
+ }
+ }
+ return false;
+}
+
} // namespace media
diff --git a/media/audio/audio_util.h b/media/audio/audio_util.h
index 14fe169..edfe7ab 100644
--- a/media/audio/audio_util.h
+++ b/media/audio/audio_util.h
@@ -9,6 +9,11 @@
namespace media {
+// For all audio functions 3 audio formats are supported:
+// 8 bits unsigned 0 to 255.
+// 16 bit signed (little endian).
+// 32 bit signed (little endian)
+
// AdjustVolume() does a software volume adjustment of a sample buffer.
// The samples are multiplied by the volume, which should range from
// 0.0 (mute) to 1.0 (full volume).
@@ -25,6 +30,25 @@ bool AdjustVolume(void* buf,
int bytes_per_sample,
float volume);
+// FoldChannels() does a software multichannel folding down to stereo.
+// Channel order is assumed to be 5.1 Dolby standard which is
+// front left, front right, center, surround left, surround right.
+// The subwoofer is ignored.
+// 6.1 adds a rear center speaker, and 7.1 has 2 rear speakers. These
+// channels are rare and ignored.
+// After summing the channels, volume is adjusted and the samples are
+// clipped to the maximum value.
+// Volume should normally range from 0.0 (mute) to 1.0 (full volume), but
+// since clamping is performed a value of more than 1 is allowed to increase
+// volume.
+// The buffer is modified in-place to avoid memory management, as this
+// function may be called in performance critical code.
+bool FoldChannels(void* buf,
+ size_t buflen,
+ int channels,
+ int bytes_per_sample,
+ float volume);
+
} // namespace media
#endif // MEDIA_AUDIO_AUDIO_UTIL_H_
diff --git a/media/audio/audio_util_unittest.cc b/media/audio/audio_util_unittest.cc
index 415a108..aa5df4c 100644
--- a/media/audio/audio_util_unittest.cc
+++ b/media/audio/audio_util_unittest.cc
@@ -50,6 +50,19 @@ TEST(AudioUtilTest, AdjustVolume_s16_zero) {
EXPECT_EQ(0, expected_test);
}
+TEST(AudioUtilTest, AdjustVolume_s16_one) {
+ // Test AdjustVolume() on 16 bit samples.
+ int16 samples_s16[kNumberOfSamples] = { -4, 0x40, -32768, 123 };
+ int16 expected_s16[kNumberOfSamples] = { -4, 0x40, -32768, 123 };
+ bool result_s16 = media::AdjustVolume(samples_s16, sizeof(samples_s16),
+ 2, // channels.
+ sizeof(samples_s16[0]),
+ 1.0f);
+ EXPECT_EQ(true, result_s16);
+ int expected_test = memcmp(samples_s16, expected_s16, sizeof(expected_s16));
+ EXPECT_EQ(0, expected_test);
+}
+
TEST(AudioUtilTest, AdjustVolume_s32) {
// Test AdjustVolume() on 32 bit samples.
int32 samples_s32[kNumberOfSamples] = { -4, 0x40, -32768, 123 };
@@ -63,4 +76,62 @@ TEST(AudioUtilTest, AdjustVolume_s32) {
EXPECT_EQ(0, expected_test);
}
+TEST(AudioUtilTest, FoldChannels_u8) {
+ // Test AdjustVolume() on 16 bit samples.
+ uint8 samples_u8[6] = { 130, 100, 150, 70, 130, 170 };
+ uint8 expected_u8[2] = { 43, 153 };
+ bool result_u8 = media::FoldChannels(samples_u8, sizeof(samples_u8),
+ 6, // channels.
+ sizeof(samples_u8[0]),
+ 1.0f);
+ EXPECT_EQ(true, result_u8);
+ int expected_test = memcmp(samples_u8, expected_u8, sizeof(expected_u8));
+ EXPECT_EQ(0, expected_test);
+}
+
+TEST(AudioUtilTest, FoldChannels_s16) {
+ // Test AdjustVolume() on 16 bit samples.
+ int16 samples_s16[6] = { 12, 1, 3, 7, 13, 17 };
+ int16 expected_s16[2] = { static_cast<int16>(12 * .707 + 1 + 7),
+ static_cast<int16>(12 * .707 + 3 + 13) };
+ bool result_s16 = media::FoldChannels(samples_s16, sizeof(samples_s16),
+ 6, // channels.
+ sizeof(samples_s16[0]),
+ 1.00f);
+ EXPECT_EQ(true, result_s16);
+ int expected_test = memcmp(samples_s16, expected_s16, sizeof(expected_s16));
+ EXPECT_EQ(0, expected_test);
+}
+
+TEST(AudioUtilTest, FoldChannels_s32) {
+ // Test AdjustVolume() on 16 bit samples.
+ int32 samples_s32[6] = { 12, 1, 3, 7, 13, 17 };
+ int32 expected_s32[2] = { static_cast<int16>(12 * .707 + 1 + 7),
+ static_cast<int16>(12 * .707 + 3 + 13) };
+ bool result_s32 = media::FoldChannels(samples_s32, sizeof(samples_s32),
+ 6, // channels.
+ sizeof(samples_s32[0]),
+ 1.00f);
+ EXPECT_EQ(true, result_s32);
+ int expected_test = memcmp(samples_s32, expected_s32, sizeof(expected_s32));
+ EXPECT_EQ(0, expected_test);
+}
+
+// This mimics 1 second of audio at 48000 samples per second.
+// Running the unittest will produce timing.
+TEST(AudioUtilTest, FoldChannels_s16_benchmark) {
+ const int kBufferSize = 1024 * 6;
+ // Test AdjustVolume() on 16 bit samples.
+ for (int i = 0; i < 48000; ++i) {
+ int16 samples_s16[kBufferSize];
+ for (int j = 0; j < kBufferSize; ++j)
+ samples_s16[j] = j;
+
+ bool result_s16 = media::FoldChannels(samples_s16, sizeof(samples_s16),
+ 6, // channels.
+ sizeof(samples_s16[0]),
+ 0.5f);
+ EXPECT_EQ(true, result_s16);
+ }
+}
} // namespace media
diff --git a/media/audio/win/waveout_output_win.cc b/media/audio/win/waveout_output_win.cc
index 124d8e7..40d17d3 100644
--- a/media/audio/win/waveout_output_win.cc
+++ b/media/audio/win/waveout_output_win.cc
@@ -29,6 +29,9 @@
// to make sure we are not executing inside the audio source's OnMoreData()
// or that we take locks inside WaveCallback() or QueueNextPacket().
+// Enable or disable software folding
+#define FOLDING 1
+
namespace {
// We settled for a double buffering scheme. It seems to strike a good balance
@@ -56,9 +59,14 @@ PCMWaveOutAudioOutputStream::PCMWaveOutAudioOutputStream(
callback_(NULL),
buffer_(NULL),
buffer_size_(0),
- volume_(1) {
+ volume_(1),
+ channels_(channels) {
format_.wFormatTag = WAVE_FORMAT_PCM;
+#ifdef FOLDING
+ format_.nChannels = channels > 2 ? 2 : channels;
+#else
format_.nChannels = channels;
+#endif
format_.nSamplesPerSec = sampling_rate;
format_.wBitsPerSample = bits_per_sample;
format_.cbSize = 0;
@@ -226,10 +234,17 @@ void PCMWaveOutAudioOutputStream::QueueNextPacket(WAVEHDR *buffer) {
// TODO(fbarchard): Handle used 0 by queueing more.
size_t used = callback_->OnMoreData(this, buffer->lpData, buffer_size_);
if (used <= buffer_size_) {
- buffer->dwBufferLength = used;
- media::AdjustVolume(buffer->lpData, buffer->dwBufferLength,
- format_.nChannels, format_.wBitsPerSample >> 3,
- volume_);
+ buffer->dwBufferLength = used * format_.nChannels / channels_;
+ if (channels_ > 2 && format_.nChannels == 2) {
+ media::FoldChannels(buffer->lpData, used,
+ channels_, format_.wBitsPerSample >> 3,
+ volume_);
+ } else {
+ media::AdjustVolume(buffer->lpData, used,
+ format_.nChannels, format_.wBitsPerSample >> 3,
+ volume_);
+ }
+
} else {
HandleError(0);
return;
diff --git a/media/audio/win/waveout_output_win.h b/media/audio/win/waveout_output_win.h
index 3f822e9..e072851 100644
--- a/media/audio/win/waveout_output_win.h
+++ b/media/audio/win/waveout_output_win.h
@@ -86,6 +86,9 @@ class PCMWaveOutAudioOutputStream : public AudioOutputStream {
// Volume level from 0 to 1.
float volume_;
+ // Channels from 0 to 6.
+ int channels_;
+
// The id assigned by the operating system to the selected wave output
// hardware device. Usually this is just -1 which means 'default device'.
UINT device_id_;