Adds stereo support for Java-based input and output audio on Android

BUG=webrtc:6718 Review-Url: https://codereview.webrtc.org/2499613002 Cr-Commit-Position: refs/heads/master@{#15104}
2016-11-16 06:30:46 -08:00 · 2016-11-16 06:30:46 -08:00 · 779017d989
commit 779017d989
parent b1ddbf9a94
8 changed files with 84 additions and 57 deletions
--- a/webrtc/modules/audio_device/android/audio_common.h
+++ b/webrtc/modules/audio_device/android/audio_common.h
@ -14,10 +14,6 @@
 namespace webrtc {

 const int kDefaultSampleRate = 44100;
-const int kNumChannels = 1;
-// Number of bytes per audio frame.
-// Example: 16-bit PCM in mono => 1*(16/8)=2 [bytes/frame]
-const size_t kBytesPerFrame = kNumChannels * (16 / 8);
 // Delay estimates for the two different supported modes. These values are based
 // on real-time round-trip delay estimates on a large set of devices and they
 // are lower bounds since the filter length is 128 ms, so the AEC works for
--- a/webrtc/modules/audio_device/android/audio_manager.cc
+++ b/webrtc/modules/audio_device/android/audio_manager.cc
@ -78,7 +78,7 @@ AudioManager::AudioManager()
  ALOGD("ctor%s", GetThreadInfo().c_str());
  RTC_CHECK(j_environment_);
  JNINativeMethod native_methods[] = {
-      {"nativeCacheAudioParameters", "(IIZZZZZZIIJ)V",
+      {"nativeCacheAudioParameters", "(IIIZZZZZZIIJ)V",
       reinterpret_cast<void*>(&webrtc::AudioManager::CacheAudioParameters)}};
  j_native_registration_ = j_environment_->RegisterNatives(
      "org/webrtc/voiceengine/WebRtcAudioManager", native_methods,
@ -228,7 +228,8 @@ int AudioManager::GetDelayEstimateInMilliseconds() const {
 void JNICALL AudioManager::CacheAudioParameters(JNIEnv* env,
                                                jobject obj,
                                                jint sample_rate,
-                                                jint channels,
+                                                jint output_channels,
+                                                jint input_channels,
                                                jboolean hardware_aec,
                                                jboolean hardware_agc,
                                                jboolean hardware_ns,
@ -241,14 +242,15 @@ void JNICALL AudioManager::CacheAudioParameters(JNIEnv* env,
  webrtc::AudioManager* this_object =
      reinterpret_cast<webrtc::AudioManager*>(native_audio_manager);
  this_object->OnCacheAudioParameters(
-      env, sample_rate, channels, hardware_aec, hardware_agc, hardware_ns,
-      low_latency_output, low_latency_input, pro_audio, output_buffer_size,
-      input_buffer_size);
+      env, sample_rate, output_channels, input_channels, hardware_aec,
+      hardware_agc, hardware_ns, low_latency_output, low_latency_input,
+      pro_audio, output_buffer_size, input_buffer_size);
 }

 void AudioManager::OnCacheAudioParameters(JNIEnv* env,
                                          jint sample_rate,
-                                          jint channels,
+                                          jint output_channels,
+                                          jint input_channels,
                                          jboolean hardware_aec,
                                          jboolean hardware_agc,
                                          jboolean hardware_ns,
@ -265,7 +267,8 @@ void AudioManager::OnCacheAudioParameters(JNIEnv* env,
  ALOGD("low_latency_input: %d", low_latency_input);
  ALOGD("pro_audio: %d", pro_audio);
  ALOGD("sample_rate: %d", sample_rate);
-  ALOGD("channels: %d", channels);
+  ALOGD("output_channels: %d", output_channels);
+  ALOGD("input_channels: %d", input_channels);
  ALOGD("output_buffer_size: %d", output_buffer_size);
  ALOGD("input_buffer_size: %d", input_buffer_size);
  RTC_DCHECK(thread_checker_.CalledOnValidThread());
@ -275,10 +278,9 @@ void AudioManager::OnCacheAudioParameters(JNIEnv* env,
  low_latency_playout_ = low_latency_output;
  low_latency_record_ = low_latency_input;
  pro_audio_ = pro_audio;
-  // TODO(henrika): add support for stereo output.
-  playout_parameters_.reset(sample_rate, static_cast<size_t>(channels),
+  playout_parameters_.reset(sample_rate, static_cast<size_t>(output_channels),
                            static_cast<size_t>(output_buffer_size));
-  record_parameters_.reset(sample_rate, static_cast<size_t>(channels),
+  record_parameters_.reset(sample_rate, static_cast<size_t>(input_channels),
                           static_cast<size_t>(input_buffer_size));
 }

--- a/webrtc/modules/audio_device/android/audio_manager.h
+++ b/webrtc/modules/audio_device/android/audio_manager.h
@ -120,7 +120,8 @@ class AudioManager {
  static void JNICALL CacheAudioParameters(JNIEnv* env,
                                           jobject obj,
                                           jint sample_rate,
-                                           jint channels,
+                                           jint output_channels,
+                                           jint input_channels,
                                           jboolean hardware_aec,
                                           jboolean hardware_agc,
                                           jboolean hardware_ns,
@ -132,7 +133,8 @@ class AudioManager {
                                           jlong native_audio_manager);
  void OnCacheAudioParameters(JNIEnv* env,
                              jint sample_rate,
-                              jint channels,
+                              jint output_channels,
+                              jint input_channels,
                              jboolean hardware_aec,
                              jboolean hardware_agc,
                              jboolean hardware_ns,
--- a/webrtc/modules/audio_device/android/audio_record_jni.cc
+++ b/webrtc/modules/audio_device/android/audio_record_jni.cc
@ -132,8 +132,9 @@ int32_t AudioRecordJni::InitRecording() {
  }
  frames_per_buffer_ = static_cast<size_t>(frames_per_buffer);
  ALOGD("frames_per_buffer: %" PRIuS, frames_per_buffer_);
+  const size_t bytes_per_frame = audio_parameters_.channels() * sizeof(int16_t);
  RTC_CHECK_EQ(direct_buffer_capacity_in_bytes_,
-               frames_per_buffer_ * kBytesPerFrame);
+               frames_per_buffer_ * bytes_per_frame);
  RTC_CHECK_EQ(frames_per_buffer_, audio_parameters_.frames_per_10ms_buffer());
  initialized_ = true;
  return 0;
--- a/webrtc/modules/audio_device/android/audio_track_jni.cc
+++ b/webrtc/modules/audio_device/android/audio_track_jni.cc
@ -227,7 +227,8 @@ void AudioTrackJni::OnCacheDirectBufferAddress(
  jlong capacity = env->GetDirectBufferCapacity(byte_buffer);
  ALOGD("direct buffer capacity: %lld", capacity);
  direct_buffer_capacity_in_bytes_ = static_cast<size_t>(capacity);
-  frames_per_buffer_ = direct_buffer_capacity_in_bytes_ / kBytesPerFrame;
+  const size_t bytes_per_frame = audio_parameters_.channels() * sizeof(int16_t);
+  frames_per_buffer_ = direct_buffer_capacity_in_bytes_ / bytes_per_frame;
  ALOGD("frames_per_buffer: %" PRIuS, frames_per_buffer_);
 }

@ -242,7 +243,8 @@ void JNICALL AudioTrackJni::GetPlayoutData(
 // the thread is 'AudioRecordTrack'.
 void AudioTrackJni::OnGetPlayoutData(size_t length) {
  RTC_DCHECK(thread_checker_java_.CalledOnValidThread());
-  RTC_DCHECK_EQ(frames_per_buffer_, length / kBytesPerFrame);
+  const size_t bytes_per_frame = audio_parameters_.channels() * sizeof(int16_t);
+  RTC_DCHECK_EQ(frames_per_buffer_, length / bytes_per_frame);
  if (!audio_device_buffer_) {
    ALOGE("AttachAudioBuffer has not been called!");
    return;
@ -257,7 +259,7 @@ void AudioTrackJni::OnGetPlayoutData(size_t length) {
  // Copy decoded data into common byte buffer to ensure that it can be
  // written to the Java based audio track.
  samples = audio_device_buffer_->GetPlayoutData(direct_buffer_address_);
-  RTC_DCHECK_EQ(length, kBytesPerFrame * samples);
+  RTC_DCHECK_EQ(length, bytes_per_frame * samples);
 }

 }  // namespace webrtc
--- a/webrtc/modules/audio_device/android/java/src/org/webrtc/voiceengine/WebRtcAudioManager.java
+++ b/webrtc/modules/audio_device/android/java/src/org/webrtc/voiceengine/WebRtcAudioManager.java
@ -38,27 +38,46 @@ public class WebRtcAudioManager {

  private static final String TAG = "WebRtcAudioManager";

+  // Use mono as default for both audio directions.
+  private static boolean useStereoOutput = false;
+  private static boolean useStereoInput = false;
+
  private static boolean blacklistDeviceForOpenSLESUsage = false;
  private static boolean blacklistDeviceForOpenSLESUsageIsOverridden = false;

-  // Call this method to override the deault list of blacklisted devices
+  // Call this method to override the default list of blacklisted devices
  // specified in WebRtcAudioUtils.BLACKLISTED_OPEN_SL_ES_MODELS.
-  // Allows an app to take control over which devices to exlude from using
+  // Allows an app to take control over which devices to exclude from using
  // the OpenSL ES audio output path
  public static synchronized void setBlacklistDeviceForOpenSLESUsage(boolean enable) {
    blacklistDeviceForOpenSLESUsageIsOverridden = true;
    blacklistDeviceForOpenSLESUsage = enable;
  }

+  // Call these methods to override the default mono audio modes for the specified direction(s)
+  // (input and/or output).
+  public static synchronized void setStereoOutput(boolean enable) {
+    Logging.w(TAG, "Overriding default output behavior: setStereoOutput(" + enable + ')');
+    useStereoOutput = enable;
+  }
+  public static synchronized void setStereoInput(boolean enable) {
+    Logging.w(TAG, "Overriding default input behavior: setStereoInput(" + enable + ')');
+    useStereoInput = enable;
+  }
+
+  public static synchronized boolean getStereoOutput() {
+    return useStereoOutput;
+  }
+  public static synchronized boolean getStereoInput() {
+    return useStereoInput;
+  }
+
  // Default audio data format is PCM 16 bit per sample.
  // Guaranteed to be supported by all devices.
  private static final int BITS_PER_SAMPLE = 16;

  private static final int DEFAULT_FRAME_PER_BUFFER = 256;

-  // TODO(henrika): add stereo support for playout.
-  private static final int CHANNELS = 1;
-
  // List of possible audio modes.
  private static final String[] AUDIO_MODES = new String[] {
      "MODE_NORMAL", "MODE_RINGTONE", "MODE_IN_CALL", "MODE_IN_COMMUNICATION",
@ -132,7 +151,8 @@ public class WebRtcAudioManager {
  private boolean lowLatencyInput;
  private boolean proAudio;
  private int sampleRate;
-  private int channels;
+  private int outputChannels;
+  private int inputChannels;
  private int outputBufferSize;
  private int inputBufferSize;

@ -148,8 +168,8 @@ public class WebRtcAudioManager {
    }
    volumeLogger = new VolumeLogger(audioManager);
    storeAudioParameters();
-    nativeCacheAudioParameters(sampleRate, channels, hardwareAEC, hardwareAGC, hardwareNS,
-        lowLatencyOutput, lowLatencyInput, proAudio, outputBufferSize, inputBufferSize,
+    nativeCacheAudioParameters(sampleRate, outputChannels, inputChannels, hardwareAEC, hardwareAGC,
+        hardwareNS, lowLatencyOutput, lowLatencyInput, proAudio, outputBufferSize, inputBufferSize,
        nativeAudioManager);
  }

@ -187,9 +207,8 @@ public class WebRtcAudioManager {
  }

  private void storeAudioParameters() {
-    // Only mono is supported currently (in both directions).
-    // TODO(henrika): add support for stereo playout.
-    channels = CHANNELS;
+    outputChannels = getStereoOutput() ? 2 : 1;
+    inputChannels = getStereoInput() ? 2 : 1;
    sampleRate = getNativeOutputSampleRate();
    hardwareAEC = isAcousticEchoCancelerSupported();
    // TODO(henrika): use of hardware AGC is no longer supported. Currently
@ -200,9 +219,9 @@ public class WebRtcAudioManager {
    lowLatencyInput = isLowLatencyInputSupported();
    proAudio = isProAudioSupported();
    outputBufferSize = lowLatencyOutput ? getLowLatencyOutputFramesPerBuffer()
-                                        : getMinOutputFrameSize(sampleRate, channels);
+                                        : getMinOutputFrameSize(sampleRate, outputChannels);
    inputBufferSize = lowLatencyInput ? getLowLatencyInputFramesPerBuffer()
-                                      : getMinInputFrameSize(sampleRate, channels);
+                                      : getMinInputFrameSize(sampleRate, inputChannels);
  }

  // Gets the current earpiece state.
@ -298,14 +317,8 @@ public class WebRtcAudioManager {
  // lacks support of low-latency output.
  private static int getMinOutputFrameSize(int sampleRateInHz, int numChannels) {
    final int bytesPerFrame = numChannels * (BITS_PER_SAMPLE / 8);
-    final int channelConfig;
-    if (numChannels == 1) {
-      channelConfig = AudioFormat.CHANNEL_OUT_MONO;
-    } else if (numChannels == 2) {
-      channelConfig = AudioFormat.CHANNEL_OUT_STEREO;
-    } else {
-      return -1;
-    }
+    final int channelConfig =
+        (numChannels == 1 ? AudioFormat.CHANNEL_OUT_MONO : AudioFormat.CHANNEL_OUT_STEREO);
    return AudioTrack.getMinBufferSize(
               sampleRateInHz, channelConfig, AudioFormat.ENCODING_PCM_16BIT)
        / bytesPerFrame;
@ -322,9 +335,10 @@ public class WebRtcAudioManager {
  // lacks support of low-latency input.
  private static int getMinInputFrameSize(int sampleRateInHz, int numChannels) {
    final int bytesPerFrame = numChannels * (BITS_PER_SAMPLE / 8);
-    assertTrue(numChannels == CHANNELS);
+    final int channelConfig =
+        (numChannels == 1 ? AudioFormat.CHANNEL_IN_MONO : AudioFormat.CHANNEL_IN_STEREO);
    return AudioRecord.getMinBufferSize(
-               sampleRateInHz, AudioFormat.CHANNEL_IN_MONO, AudioFormat.ENCODING_PCM_16BIT)
+               sampleRateInHz, channelConfig, AudioFormat.ENCODING_PCM_16BIT)
        / bytesPerFrame;
  }

@ -341,7 +355,8 @@ public class WebRtcAudioManager {
    }
  }

-  private native void nativeCacheAudioParameters(int sampleRate, int channels, boolean hardwareAEC,
-      boolean hardwareAGC, boolean hardwareNS, boolean lowLatencyOutput, boolean lowLatencyInput,
-      boolean proAudio, int outputBufferSize, int inputBufferSize, long nativeAudioManager);
+  private native void nativeCacheAudioParameters(int sampleRate, int outputChannels,
+      int inputChannels, boolean hardwareAEC, boolean hardwareAGC, boolean hardwareNS,
+      boolean lowLatencyOutput, boolean lowLatencyInput, boolean proAudio, int outputBufferSize,
+      int inputBufferSize, long nativeAudioManager);
 }
--- a/webrtc/modules/audio_device/android/java/src/org/webrtc/voiceengine/WebRtcAudioRecord.java
+++ b/webrtc/modules/audio_device/android/java/src/org/webrtc/voiceengine/WebRtcAudioRecord.java
@ -170,8 +170,9 @@ public class WebRtcAudioRecord {
    // Get the minimum buffer size required for the successful creation of
    // an AudioRecord object, in byte units.
    // Note that this size doesn't guarantee a smooth recording under load.
-    int minBufferSize = AudioRecord.getMinBufferSize(
-        sampleRate, AudioFormat.CHANNEL_IN_MONO, AudioFormat.ENCODING_PCM_16BIT);
+    final int channelConfig = channelCountToConfiguration(channels);
+    int minBufferSize =
+        AudioRecord.getMinBufferSize(sampleRate, channelConfig, AudioFormat.ENCODING_PCM_16BIT);
    if (minBufferSize == AudioRecord.ERROR || minBufferSize == AudioRecord.ERROR_BAD_VALUE) {
      Logging.e(TAG, "AudioRecord.getMinBufferSize failed: " + minBufferSize);
      return -1;
@ -184,8 +185,8 @@ public class WebRtcAudioRecord {
    int bufferSizeInBytes = Math.max(BUFFER_SIZE_FACTOR * minBufferSize, byteBuffer.capacity());
    Logging.d(TAG, "bufferSizeInBytes: " + bufferSizeInBytes);
    try {
-      audioRecord = new AudioRecord(AudioSource.VOICE_COMMUNICATION, sampleRate,
-          AudioFormat.CHANNEL_IN_MONO, AudioFormat.ENCODING_PCM_16BIT, bufferSizeInBytes);
+      audioRecord = new AudioRecord(AudioSource.VOICE_COMMUNICATION, sampleRate, channelConfig,
+          AudioFormat.ENCODING_PCM_16BIT, bufferSizeInBytes);
    } catch (IllegalArgumentException e) {
      Logging.e(TAG, e.getMessage());
      return -1;
@ -246,7 +247,7 @@ public class WebRtcAudioRecord {
  // created instance uses the parameters that we asked for.
  private boolean areParametersValid(int sampleRate, int channels) {
    return (audioRecord.getAudioFormat() == AudioFormat.ENCODING_PCM_16BIT
-        && audioRecord.getChannelConfiguration() == AudioFormat.CHANNEL_IN_MONO
+        && audioRecord.getChannelConfiguration() == channelCountToConfiguration(channels)
        && audioRecord.getAudioSource() == AudioSource.VOICE_COMMUNICATION
        && audioRecord.getSampleRate() == sampleRate && audioRecord.getChannelCount() == channels);
  }
@ -273,6 +274,10 @@ public class WebRtcAudioRecord {
    }
  }

+  private int channelCountToConfiguration(int channels) {
+    return (channels == 1 ? AudioFormat.CHANNEL_IN_MONO : AudioFormat.CHANNEL_IN_STEREO);
+  }
+
  private native void nativeCacheDirectBufferAddress(ByteBuffer byteBuffer, long nativeAudioRecord);

  private native void nativeDataIsRecorded(int bytes, long nativeAudioRecord);
--- a/webrtc/modules/audio_device/android/java/src/org/webrtc/voiceengine/WebRtcAudioTrack.java
+++ b/webrtc/modules/audio_device/android/java/src/org/webrtc/voiceengine/WebRtcAudioTrack.java
@ -174,8 +174,9 @@ public class WebRtcAudioTrack {
    // AudioTrack object to be created in the MODE_STREAM mode.
    // Note that this size doesn't guarantee a smooth playback under load.
    // TODO(henrika): should we extend the buffer size to avoid glitches?
-    final int minBufferSizeInBytes = AudioTrack.getMinBufferSize(
-        sampleRate, AudioFormat.CHANNEL_OUT_MONO, AudioFormat.ENCODING_PCM_16BIT);
+    final int channelConfig = channelCountToConfiguration(channels);
+    final int minBufferSizeInBytes =
+        AudioTrack.getMinBufferSize(sampleRate, channelConfig, AudioFormat.ENCODING_PCM_16BIT);
    Logging.d(TAG, "AudioTrack.getMinBufferSize: " + minBufferSizeInBytes);
    // For the streaming mode, data must be written to the audio sink in
    // chunks of size (given by byteBuffer.capacity()) less than or equal
@ -197,9 +198,8 @@ public class WebRtcAudioTrack {
      // Create an AudioTrack object and initialize its associated audio buffer.
      // The size of this buffer determines how long an AudioTrack can play
      // before running out of data.
-      audioTrack =
-          new AudioTrack(AudioManager.STREAM_VOICE_CALL, sampleRate, AudioFormat.CHANNEL_OUT_MONO,
-              AudioFormat.ENCODING_PCM_16BIT, minBufferSizeInBytes, AudioTrack.MODE_STREAM);
+      audioTrack = new AudioTrack(AudioManager.STREAM_VOICE_CALL, sampleRate, channelConfig,
+          AudioFormat.ENCODING_PCM_16BIT, minBufferSizeInBytes, AudioTrack.MODE_STREAM);
    } catch (IllegalArgumentException e) {
      Logging.d(TAG, e.getMessage());
      return false;
@ -285,7 +285,7 @@ public class WebRtcAudioTrack {
  private boolean areParametersValid(int sampleRate, int channels) {
    final int streamType = audioTrack.getStreamType();
    return (audioTrack.getAudioFormat() == AudioFormat.ENCODING_PCM_16BIT
-        && audioTrack.getChannelConfiguration() == AudioFormat.CHANNEL_OUT_MONO
+        && audioTrack.getChannelConfiguration() == channelCountToConfiguration(channels)
        && streamType == AudioManager.STREAM_VOICE_CALL && audioTrack.getSampleRate() == sampleRate
        && sampleRate == audioTrack.getNativeOutputSampleRate(streamType)
        && audioTrack.getChannelCount() == channels);
@ -332,6 +332,10 @@ public class WebRtcAudioTrack {
    }
  }

+  private int channelCountToConfiguration(int channels) {
+    return (channels == 1 ? AudioFormat.CHANNEL_OUT_MONO : AudioFormat.CHANNEL_OUT_STEREO);
+  }
+
  private native void nativeCacheDirectBufferAddress(ByteBuffer byteBuffer, long nativeAudioRecord);

  private native void nativeGetPlayoutData(int bytes, long nativeAudioRecord);