Refactoring for typing detection

R=henrika@webrtc.org

Review URL: https://webrtc-codereview.appspot.com/1370004

git-svn-id: http://webrtc.googlecode.com/svn/trunk@3976 4adac7df-926f-26a2-2b94-8c16560cd09d
niklas.enbom@webrtc.org 2013-05-07 21:04:24 +00:00
parent ef14488d03
commit 3be565b502
19 changed files with 79 additions and 53 deletions
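Summary of the change: each platform AudioDevice (Mac, Windows Core Audio, Windows Wave) now scans the keyboard on its own capture thread and pushes the result into the shared AudioDeviceBuffer via a new SetTypingStatus() call. The buffer forwards the flag through AudioTransport::RecordedDataIsAvailable() (new keyPressed argument) down to TransmitMixer::PrepareDemux() and TypingDetection(keyPressed), replacing the old platform-#ifdef'd EventWrapper::KeyPressed() helper, which is deleted. The sketch below shows the new plumbing in simplified form; the class and comments are illustrative, not the actual WebRTC implementation:

    // Simplified sketch of the new key-press plumbing (illustrative only).
    #include <cstdint>

    class AudioDeviceBufferSketch {
     public:
      // The capture thread reports whether any key was down while the current
      // audio block was recorded (see SetTypingStatus() in the diff below).
      int32_t SetTypingStatus(bool typing_status) {
        typing_status_ = typing_status;
        return 0;
      }
      // DeliverRecordedData() then forwards the stored flag as the new
      // keyPressed argument of AudioTransport::RecordedDataIsAvailable();
      // VoEBaseImpl passes it on to TransmitMixer::PrepareDemux(), which calls
      // TypingDetection(keyPressed) instead of polling EventWrapper.
      bool typing_status() const { return typing_status_; }

     private:
      bool typing_status_ = false;
    };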


@@ -46,6 +46,7 @@ AudioDeviceBuffer::AudioDeviceBuffer() :
_playFile(*FileWrapper::Create()),
_currentMicLevel(0),
_newMicLevel(0),
_typingStatus(false),
_playDelayMS(0),
_recDelayMS(0),
_clockDrift(0) {
@@ -266,6 +267,12 @@ int32_t AudioDeviceBuffer::SetCurrentMicLevel(uint32_t level)
return 0;
}
int32_t AudioDeviceBuffer::SetTypingStatus(bool typingStatus)
{
_typingStatus = typingStatus;
return 0;
}
// ----------------------------------------------------------------------------
// NewMicLevel
// ----------------------------------------------------------------------------
@@ -469,6 +476,7 @@ int32_t AudioDeviceBuffer::DeliverRecordedData()
totalDelayMS,
_clockDrift,
_currentMicLevel,
_typingStatus,
newMicLevel);
if (res != -1)
{


@@ -67,6 +67,8 @@ public:
const char fileName[kAdmMaxFileNameSize]);
int32_t StopOutputFileRecording();
int32_t SetTypingStatus(bool typingStatus);
AudioDeviceBuffer();
~AudioDeviceBuffer();
@@ -110,6 +112,8 @@ private:
uint32_t _currentMicLevel;
uint32_t _newMicLevel;
bool _typingStatus;
uint32_t _playDelayMS;
uint32_t _recDelayMS;


@@ -62,6 +62,7 @@ public:
const uint32_t totalDelayMS,
const int32_t clockDrift,
const uint32_t currentMicLevel,
const bool keyPressed,
uint32_t& newMicLevel) = 0;
virtual int32_t NeedMorePlayData(const uint32_t nSamples,


@@ -13,15 +13,17 @@
#include "audio_device_config.h"
#include "event_wrapper.h"
#include "portaudio/pa_ringbuffer.h"
#include "trace.h"
#include "thread_wrapper.h"
#include <ApplicationServices/ApplicationServices.h>
#include <cassert>
#include <sys/sysctl.h> // sysctlbyname()
#include <mach/mach.h> // mach_task_self()
#include <libkern/OSAtomic.h> // OSAtomicCompareAndSwap()
#include "portaudio/pa_ringbuffer.h"
#include <mach/mach.h> // mach_task_self()
#include <sys/sysctl.h> // sysctlbyname()
namespace webrtc
{
@@ -3207,6 +3209,8 @@ bool AudioDeviceMac::CaptureWorkerThread()
_ptrAudioBuffer->SetVQEData(msecOnPlaySide, msecOnRecordSide, 0);
_ptrAudioBuffer->SetTypingStatus(KeyPressed());
// deliver recorded samples at specified sample rate, mic level etc.
// to the observer using callback
_ptrAudioBuffer->DeliverRecordedData();
@@ -3236,4 +3240,14 @@ bool AudioDeviceMac::CaptureWorkerThread()
return true;
}
bool AudioDeviceMac::KeyPressed() const {
bool key_down = false;
// Loop through all Mac virtual key constants (0x00 - 0x5C).
for (int key_index = 0; key_index <= 0x5C; key_index++) {
key_down |= CGEventSourceKeyState(kCGEventSourceStateHIDSystemState,
key_index);
}
return key_down;
}
} // namespace webrtc
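Note that CGEventSourceKeyState() reports the momentary state of a key, so a keystroke that begins and ends between two capture callbacks can be missed; the loop covers virtual key codes 0x00 through 0x5C. A standalone, macOS-only sketch of the same polling idea (file name and build line are illustrative):

    // keyscan_mac.cc - build with:
    //   clang++ keyscan_mac.cc -framework ApplicationServices -o keyscan_mac
    #include <ApplicationServices/ApplicationServices.h>
    #include <cstdio>

    static bool AnyKeyDown() {
      bool key_down = false;
      // Poll the HID system state for every standard virtual key code.
      for (CGKeyCode key = 0; key <= 0x5C; ++key) {
        key_down |= CGEventSourceKeyState(kCGEventSourceStateHIDSystemState, key);
      }
      return key_down;
    }

    int main() {
      std::printf("any key currently down: %s\n", AnyKeyDown() ? "yes" : "no");
      return 0;
    }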


@@ -293,6 +293,9 @@ private:
bool CaptureWorkerThread();
bool RenderWorkerThread();
private:
bool KeyPressed() const;
private:
AudioDeviceBuffer* _ptrAudioBuffer;


@@ -92,6 +92,7 @@ class AudioTransportAPI: public AudioTransport {
const uint32_t totalDelay,
const int32_t clockSkew,
const uint32_t currentMicLevel,
const bool keyPressed,
uint32_t& newMicLevel) {
rec_count_++;
if (rec_count_ % 100 == 0) {


@@ -176,6 +176,7 @@ int32_t AudioTransportImpl::RecordedDataIsAvailable(
const uint32_t totalDelayMS,
const int32_t clockDrift,
const uint32_t currentMicLevel,
const bool keyPressed,
uint32_t& newMicLevel)
{
if (_fullDuplex && _audioList.GetSize() < 15)


@@ -101,6 +101,7 @@ public:
const uint32_t totalDelayMS,
const int32_t clockDrift,
const uint32_t currentMicLevel,
const bool keyPressed,
uint32_t& newMicLevel);
virtual int32_t NeedMorePlayData(const uint32_t nSamples,


@@ -4092,6 +4092,8 @@ DWORD AudioDeviceWindowsCore::DoCaptureThread()
sndCardRecDelay,
0);
_ptrAudioBuffer->SetTypingStatus(KeyPressed());
QueryPerformanceCounter(&t1); // measure time: START
_UnLock(); // release lock while making the callback
@@ -5145,6 +5147,16 @@ char* AudioDeviceWindowsCore::WideToUTF8(const TCHAR* src) const {
#endif
}
bool AudioDeviceWindowsCore::KeyPressed() const {
int key_down = 0;
for (int key = VK_SPACE; key < VK_NUMLOCK; key++) {
short res = GetAsyncKeyState(key);
key_down |= res & 0x1; // Get the LSB
}
return (key_down > 0);
}
} // namespace webrtc
#endif // WEBRTC_WINDOWS_CORE_AUDIO_BUILD
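Unlike the Mac version, GetAsyncKeyState() also latches a "pressed since the previous call" flag in its least significant bit, which is what the loop above accumulates, so short keystrokes between polls are still caught. Scanning from VK_SPACE (0x20) up to but not including VK_NUMLOCK (0x90) covers the space bar, digits, letters, the numeric keypad and the function keys while skipping mouse buttons and modifier keys. A standalone Windows sketch of the same loop (illustrative only):

    // keyscan_win.cc - Windows-only sketch of the polling loop used above.
    #include <windows.h>
    #include <cstdio>

    static bool AnyKeyPressedSinceLastPoll() {
      int key_down = 0;
      for (int key = VK_SPACE; key < VK_NUMLOCK; key++) {
        // LSB of GetAsyncKeyState(): key was pressed after the previous call.
        SHORT res = GetAsyncKeyState(key);
        key_down |= res & 0x1;
      }
      return key_down > 0;
    }

    int main() {
      std::printf("typed since last poll: %d\n", AnyKeyPressedSinceLastPoll());
      return 0;
    }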


@@ -210,6 +210,9 @@ public:
public:
virtual void AttachAudioBuffer(AudioDeviceBuffer* audioBuffer);
private:
bool KeyPressed() const;
private: // avrt function pointers
PAvRevertMmThreadCharacteristics _PAvRevertMmThreadCharacteristics;
PAvSetMmThreadCharacteristicsA _PAvSetMmThreadCharacteristicsA;


@@ -3359,6 +3359,8 @@ int32_t AudioDeviceWindowsWave::RecProc(LONGLONG& consumedTime)
_ptrAudioBuffer->SetVQEData(msecOnPlaySide, msecOnRecordSide, drift);
_ptrAudioBuffer->SetTypingStatus(KeyPressed());
// Store the play and rec delay values for video synchronization
_sndCardPlayDelay = msecOnPlaySide;
_sndCardRecDelay = msecOnRecordSide;
@@ -3820,5 +3822,15 @@ int32_t AudioDeviceWindowsWave::RestartTimerIfNeeded(const uint32_t time)
return 0;
}
bool AudioDeviceWindowsWave::KeyPressed() const {
int key_down = 0;
for (int key = VK_SPACE; key < VK_NUMLOCK; key++) {
short res = GetAsyncKeyState(key);
key_down |= res & 0x1; // Get the LSB
}
return (key_down > 0);
}
} // namespace webrtc


@@ -177,6 +177,9 @@ private:
inline int32_t InputSanityCheckAfterUnlockedPeriod() const;
inline int32_t OutputSanityCheckAfterUnlockedPeriod() const;
private:
bool KeyPressed() const;
private:
int32_t EnumeratePlayoutDevices();
int32_t EnumerateRecordingDevices();


@@ -54,12 +54,6 @@ class EventWrapper {
virtual bool StopTimer() = 0;
// Only implemented on Windows
// Returns 1 if a key has been pressed since last call to this function.
// -1 indicates failure
// 0 indicates no key has been pressed since last call
// TODO(hellner) this function does not seem to belong here
static int KeyPressed();
};
} // namespace webrtc


@@ -30,33 +30,4 @@ EventWrapper* EventWrapper::Create() {
return EventPosix::Create();
#endif
}
int EventWrapper::KeyPressed() {
#if defined(_WIN32)
int key_down = 0;
for (int key = 0x20; key < 0x90; key++) {
short res = GetAsyncKeyState(key);
key_down |= res % 2; // Get the LSB
}
if (key_down) {
return 1;
} else {
return 0;
}
#elif defined(WEBRTC_MAC) && !defined(WEBRTC_IOS)
bool key_down = false;
// loop through all Mac virtual key constant values
for (int key_index = 0; key_index <= 0x5C; key_index++) {
key_down |= CGEventSourceKeyState(kCGEventSourceStateHIDSystemState,
key_index);
}
if (key_down) {
return 1;
} else {
return 0;
}
#else
return -1;
#endif
}
} // namespace webrtc


@@ -332,7 +332,8 @@ TransmitMixer::PrepareDemux(const void* audioSamples,
const uint32_t samplesPerSec,
const uint16_t totalDelayMS,
const int32_t clockDrift,
const uint16_t currentMicLevel)
const uint16_t currentMicLevel,
const bool keyPressed)
{
WEBRTC_TRACE(kTraceStream, kTraceVoice, VoEId(_instanceId, -1),
"TransmitMixer::PrepareDemux(nSamples=%u, nChannels=%u,"
@@ -369,7 +370,7 @@ TransmitMixer::PrepareDemux(const void* audioSamples,
// --- Annoying typing detection (utilizes the APM/VAD decision)
#ifdef WEBRTC_VOICE_ENGINE_TYPING_DETECTION
TypingDetection();
TypingDetection(keyPressed);
#endif
// --- Mute during DTMF tone if direct feedback is enabled
@@ -1327,7 +1328,7 @@ void TransmitMixer::ProcessAudio(int delay_ms, int clock_drift,
}
#ifdef WEBRTC_VOICE_ENGINE_TYPING_DETECTION
int TransmitMixer::TypingDetection()
int TransmitMixer::TypingDetection(const bool keyPressed)
{
// We let the VAD determine if we're using this feature or not.
@@ -1336,13 +1337,6 @@ int TransmitMixer::TypingDetection()
return (0);
}
int keyPressed = EventWrapper::KeyPressed();
if (keyPressed < 0)
{
return (-1);
}
if (_audioFrame.vad_activity_ == AudioFrame::kVadActive)
_timeActive++;
else

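The hunk above keeps only the head of the detector: TypingDetection() now receives the hardware key state as an argument instead of polling EventWrapper::KeyPressed() (which could also fail and return -1), and still lets the VAD decision drive the frame counters. Purely as a hypothetical illustration of that shape; the actual counters and thresholds are not part of this diff:

    // Hypothetical outline only; not the real TransmitMixer scoring logic.
    struct TypingDetectorSketch {
      int time_active = 0;
      int penalty = 0;

      // Returns nonzero when key presses coincide with (short) active speech.
      int Process(bool vad_active, bool key_pressed) {
        if (vad_active)
          ++time_active;
        else
          time_active = 0;
        if (key_pressed && vad_active && time_active < 10)  // made-up threshold
          penalty += 100;
        else if (penalty > 0)
          --penalty;
        return penalty > 0 ? 1 : 0;
      }
    };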

@@ -56,7 +56,8 @@ public:
const uint32_t samplesPerSec,
const uint16_t totalDelayMS,
const int32_t clockDrift,
const uint16_t currentMicLevel);
const uint16_t currentMicLevel,
const bool keyPressed);
int32_t DemuxAndMix();
@@ -178,7 +179,7 @@ private:
void ProcessAudio(int delay_ms, int clock_drift, int current_mic_level);
#ifdef WEBRTC_VOICE_ENGINE_TYPING_DETECTION
int TypingDetection();
int TypingDetection(const bool keyPressed);
#endif
// uses


@@ -133,6 +133,7 @@ int32_t VoEBaseImpl::RecordedDataIsAvailable(
const uint32_t totalDelayMS,
const int32_t clockDrift,
const uint32_t currentMicLevel,
const bool keyPressed,
uint32_t& newMicLevel)
{
WEBRTC_TRACE(kTraceStream, kTraceVoice, VoEId(_shared->instance_id(), -1),
@@ -195,7 +196,7 @@ int32_t VoEBaseImpl::RecordedDataIsAvailable(
// (APM, mix with file, record to file, mute, etc.)
_shared->transmit_mixer()->PrepareDemux(audioSamples, nSamples, nChannels,
samplesPerSec, static_cast<uint16_t>(totalDelayMS), clockDrift,
currentVoEMicLevel);
currentVoEMicLevel, keyPressed);
// Copy the audio frame to each sending channel and perform
// channel-dependent operations (file mixing, mute, etc.) to prepare


@@ -80,6 +80,7 @@ public:
const uint32_t totalDelayMS,
const int32_t clockDrift,
const uint32_t currentMicLevel,
const bool keyPressed,
uint32_t& newMicLevel);
virtual int32_t NeedMorePlayData(const uint32_t nSamples,


@@ -244,7 +244,8 @@ int VoEExternalMediaImpl::ExternalRecordingInsertData(
samplingFreqHz,
totalDelayMS,
0,
0);
0,
false); // Typing detection not supported
shared_->transmit_mixer()->DemuxAndMix();
shared_->transmit_mixer()->EncodeAndSend();