blob: 51ca952008353b950869c733a3b36004f8b929be [file] [log] [blame]
andrew@webrtc.orgb015cbe2012-10-22 18:19:23 +00001/*
2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
11// This sub-API supports the following functionalities:
12//
13// - Noise Suppression (NS).
14// - Automatic Gain Control (AGC).
15// - Echo Control (EC).
16// - Receiving side VAD, NS and AGC.
17// - Measurements of instantaneous speech, noise and echo levels.
18// - Generation of AP debug recordings.
19// - Detection of keyboard typing which can disrupt a voice conversation.
20//
21// Usage example, omitting error checking:
22//
23// using namespace webrtc;
24// VoiceEngine* voe = VoiceEngine::Create();
25// VoEBase* base = VoEBase::GetInterface();
26// VoEAudioProcessing* ap = VoEAudioProcessing::GetInterface(voe);
27// base->Init();
28// ap->SetEcStatus(true, kAgcAdaptiveAnalog);
29// ...
30// base->Terminate();
31// base->Release();
32// ap->Release();
33// VoiceEngine::Delete(voe);
34//
35#ifndef WEBRTC_VOICE_ENGINE_VOE_AUDIO_PROCESSING_H
36#define WEBRTC_VOICE_ENGINE_VOE_AUDIO_PROCESSING_H
37
pbos@webrtc.org471ae722013-05-21 13:52:32 +000038#include "webrtc/common_types.h"
andrew@webrtc.orgb015cbe2012-10-22 18:19:23 +000039
40namespace webrtc {
41
42class VoiceEngine;
43
44// VoERxVadCallback
45class WEBRTC_DLLEXPORT VoERxVadCallback
46{
47public:
48 virtual void OnRxVad(int channel, int vadDecision) = 0;
49
50protected:
51 virtual ~VoERxVadCallback() {}
52};
53
54// VoEAudioProcessing
55class WEBRTC_DLLEXPORT VoEAudioProcessing
56{
57public:
58 // Factory for the VoEAudioProcessing sub-API. Increases an internal
59 // reference counter if successful. Returns NULL if the API is not
60 // supported or if construction fails.
61 static VoEAudioProcessing* GetInterface(VoiceEngine* voiceEngine);
62
63 // Releases the VoEAudioProcessing sub-API and decreases an internal
64 // reference counter. Returns the new reference count. This value should
65 // be zero for all sub-API:s before the VoiceEngine object can be safely
66 // deleted.
67 virtual int Release() = 0;
68
69 // Sets Noise Suppression (NS) status and mode.
70 // The NS reduces noise in the microphone signal.
71 virtual int SetNsStatus(bool enable, NsModes mode = kNsUnchanged) = 0;
72
73 // Gets the NS status and mode.
74 virtual int GetNsStatus(bool& enabled, NsModes& mode) = 0;
75
76 // Sets the Automatic Gain Control (AGC) status and mode.
77 // The AGC adjusts the microphone signal to an appropriate level.
78 virtual int SetAgcStatus(bool enable, AgcModes mode = kAgcUnchanged) = 0;
79
80 // Gets the AGC status and mode.
81 virtual int GetAgcStatus(bool& enabled, AgcModes& mode) = 0;
82
83 // Sets the AGC configuration.
84 // Should only be used in situations where the working environment
85 // is well known.
pbos@webrtc.orgca7a9a22013-05-14 08:31:39 +000086 virtual int SetAgcConfig(AgcConfig config) = 0;
andrew@webrtc.orgb015cbe2012-10-22 18:19:23 +000087
88 // Gets the AGC configuration.
89 virtual int GetAgcConfig(AgcConfig& config) = 0;
90
91 // Sets the Echo Control (EC) status and mode.
92 // The EC mitigates acoustic echo where a user can hear their own
93 // speech repeated back due to an acoustic coupling between the
94 // speaker and the microphone at the remote end.
95 virtual int SetEcStatus(bool enable, EcModes mode = kEcUnchanged) = 0;
96
97 // Gets the EC status and mode.
98 virtual int GetEcStatus(bool& enabled, EcModes& mode) = 0;
99
100 // Enables the compensation of clock drift between the capture and render
101 // streams by the echo canceller (i.e. only using EcMode==kEcAec). It will
102 // only be enabled if supported on the current platform; otherwise an error
103 // will be returned. Check if the platform is supported by calling
104 // |DriftCompensationSupported()|.
105 virtual int EnableDriftCompensation(bool enable) = 0;
106 virtual bool DriftCompensationEnabled() = 0;
107 static bool DriftCompensationSupported();
108
109 // Sets a delay |offset| in ms to add to the system delay reported by the
110 // OS, which is used by the AEC to synchronize far- and near-end streams.
111 // In some cases a system may introduce a delay which goes unreported by the
112 // OS, but which is known to the user. This method can be used to compensate
113 // for the unreported delay.
114 virtual void SetDelayOffsetMs(int offset) = 0;
115 virtual int DelayOffsetMs() = 0;
116
117 // Modifies settings for the AEC designed for mobile devices (AECM).
118 virtual int SetAecmMode(AecmModes mode = kAecmSpeakerphone,
119 bool enableCNG = true) = 0;
120
121 // Gets settings for the AECM.
122 virtual int GetAecmMode(AecmModes& mode, bool& enabledCNG) = 0;
123
124 // Enables a high pass filter on the capture signal. This removes DC bias
125 // and low-frequency noise. Recommended to be enabled.
126 virtual int EnableHighPassFilter(bool enable) = 0;
127 virtual bool IsHighPassFilterEnabled() = 0;
128
129 // Sets status and mode of the receiving-side (Rx) NS.
130 // The Rx NS reduces noise in the received signal for the specified
131 // |channel|. Intended for advanced usage only.
132 virtual int SetRxNsStatus(int channel,
133 bool enable,
134 NsModes mode = kNsUnchanged) = 0;
135
136 // Gets status and mode of the receiving-side NS.
137 virtual int GetRxNsStatus(int channel,
138 bool& enabled,
139 NsModes& mode) = 0;
140
141 // Sets status and mode of the receiving-side (Rx) AGC.
142 // The Rx AGC adjusts the received signal to an appropriate level
143 // for the specified |channel|. Intended for advanced usage only.
144 virtual int SetRxAgcStatus(int channel,
145 bool enable,
146 AgcModes mode = kAgcUnchanged) = 0;
147
148 // Gets status and mode of the receiving-side AGC.
149 virtual int GetRxAgcStatus(int channel,
150 bool& enabled,
151 AgcModes& mode) = 0;
152
153 // Modifies the AGC configuration on the receiving side for the
154 // specified |channel|.
pbos@webrtc.orgca7a9a22013-05-14 08:31:39 +0000155 virtual int SetRxAgcConfig(int channel, AgcConfig config) = 0;
andrew@webrtc.orgb015cbe2012-10-22 18:19:23 +0000156
157 // Gets the AGC configuration on the receiving side.
158 virtual int GetRxAgcConfig(int channel, AgcConfig& config) = 0;
159
160 // Registers a VoERxVadCallback |observer| instance and enables Rx VAD
161 // notifications for the specified |channel|.
162 virtual int RegisterRxVadObserver(int channel,
163 VoERxVadCallback &observer) = 0;
164
165 // Deregisters the VoERxVadCallback |observer| and disables Rx VAD
166 // notifications for the specified |channel|.
167 virtual int DeRegisterRxVadObserver(int channel) = 0;
168
169 // Gets the VAD/DTX activity for the specified |channel|.
170 // The returned value is 1 if frames of audio contains speech
171 // and 0 if silence. The output is always 1 if VAD is disabled.
172 virtual int VoiceActivityIndicator(int channel) = 0;
173
174 // Enables or disables the possibility to retrieve echo metrics and delay
175 // logging values during an active call. The metrics are only supported in
176 // AEC.
177 virtual int SetEcMetricsStatus(bool enable) = 0;
178
179 // Gets the current EC metric status.
180 virtual int GetEcMetricsStatus(bool& enabled) = 0;
181
182 // Gets the instantaneous echo level metrics.
183 virtual int GetEchoMetrics(int& ERL, int& ERLE, int& RERL, int& A_NLP) = 0;
184
185 // Gets the EC internal |delay_median| and |delay_std| in ms between
186 // near-end and far-end. The values are calculated over the time period
187 // since the last GetEcDelayMetrics() call.
188 virtual int GetEcDelayMetrics(int& delay_median, int& delay_std) = 0;
189
190 // Enables recording of Audio Processing (AP) debugging information.
191 // The file can later be used for off-line analysis of the AP performance.
192 virtual int StartDebugRecording(const char* fileNameUTF8) = 0;
193
194 // Disables recording of AP debugging information.
195 virtual int StopDebugRecording() = 0;
196
197 // Enables or disables detection of disturbing keyboard typing.
198 // An error notification will be given as a callback upon detection.
199 virtual int SetTypingDetectionStatus(bool enable) = 0;
200
201 // Gets the current typing detection status.
202 virtual int GetTypingDetectionStatus(bool& enabled) = 0;
203
204 // Reports the lower of:
205 // * Time in seconds since the last typing event.
206 // * Time in seconds since the typing detection was enabled.
207 // Returns error if typing detection is disabled.
208 virtual int TimeSinceLastTyping(int &seconds) = 0;
209
210 // Optional setting of typing detection parameters
211 // Parameter with value == 0 will be ignored
212 // and left with default config.
213 // TODO(niklase) Remove default argument as soon as libJingle is updated!
214 virtual int SetTypingDetectionParameters(int timeWindow,
215 int costPerTyping,
216 int reportingThreshold,
217 int penaltyDecay,
218 int typeEventDelay = 0) = 0;
219
220 // Swaps the capture-side left and right audio channels when enabled. It
221 // only has an effect when using a stereo send codec. The setting is
222 // persistent; it will be applied whenever a stereo send codec is enabled.
223 //
224 // The swap is applied only to the captured audio, and not mixed files. The
225 // swap will appear in file recordings and when accessing audio through the
226 // external media interface.
227 virtual void EnableStereoChannelSwapping(bool enable) = 0;
228 virtual bool IsStereoChannelSwappingEnabled() = 0;
229
230protected:
231 VoEAudioProcessing() {}
232 virtual ~VoEAudioProcessing() {}
233};
234
235} // namespace webrtc
236
237#endif // WEBRTC_VOICE_ENGINE_VOE_AUDIO_PROCESSING_H