1 /* 2 * libjingle 3 * Copyright 2004 Google Inc. 4 * 5 * Redistribution and use in source and binary forms, with or without 6 * modification, are permitted provided that the following conditions are met: 7 * 8 * 1. Redistributions of source code must retain the above copyright notice, 9 * this list of conditions and the following disclaimer. 10 * 2. Redistributions in binary form must reproduce the above copyright notice, 11 * this list of conditions and the following disclaimer in the documentation 12 * and/or other materials provided with the distribution. 13 * 3. The name of the author may not be used to endorse or promote products 14 * derived from this software without specific prior written permission. 15 * 16 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED 17 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF 18 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO 19 * EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 20 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, 21 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; 22 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, 23 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR 24 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF 25 * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 26 */ 27 28 #ifdef HAVE_CONFIG_H 29 #include <config.h> 30 #endif 31 32 #ifdef HAVE_WEBRTC_VOICE 33 34 #include "talk/media/webrtc/webrtcvoiceengine.h" 35 36 #include <algorithm> 37 #include <cstdio> 38 #include <string> 39 #include <vector> 40 41 #include "talk/base/base64.h" 42 #include "talk/base/byteorder.h" 43 #include "talk/base/common.h" 44 #include "talk/base/helpers.h" 45 #include "talk/base/logging.h" 46 #include "talk/base/stringencode.h" 47 #include "talk/base/stringutils.h" 48 #include "talk/media/base/audiorenderer.h" 49 #include "talk/media/base/constants.h" 50 #include "talk/media/base/streamparams.h" 51 #include "talk/media/base/voiceprocessor.h" 52 #include "talk/media/webrtc/webrtcvoe.h" 53 #include "webrtc/common.h" 54 #include "webrtc/modules/audio_processing/include/audio_processing.h" 55 56 #ifdef WIN32 57 #include <objbase.h> // NOLINT 58 #endif 59 60 namespace cricket { 61 62 struct CodecPref { 63 const char* name; 64 int clockrate; 65 int channels; 66 int payload_type; 67 bool is_multi_rate; 68 }; 69 70 static const CodecPref kCodecPrefs[] = { 71 { "OPUS", 48000, 2, 111, true }, 72 { "ISAC", 16000, 1, 103, true }, 73 { "ISAC", 32000, 1, 104, true }, 74 { "CELT", 32000, 1, 109, true }, 75 { "CELT", 32000, 2, 110, true }, 76 { "G722", 16000, 1, 9, false }, 77 { "ILBC", 8000, 1, 102, false }, 78 { "PCMU", 8000, 1, 0, false }, 79 { "PCMA", 8000, 1, 8, false }, 80 { "CN", 48000, 1, 107, false }, 81 { "CN", 32000, 1, 106, false }, 82 { "CN", 16000, 1, 105, false }, 83 { "CN", 8000, 1, 13, false }, 84 { "red", 8000, 1, 127, false }, 85 { "telephone-event", 8000, 1, 126, false }, 86 }; 87 88 // For Linux/Mac, using the default device is done by specifying index 0 for 89 // VoE 4.0 and not -1 (which was the case for VoE 3.5). 90 // 91 // On Windows Vista and newer, Microsoft introduced the concept of "Default 92 // Communications Device". This means that there are two types of default 93 // devices (old Wave Audio style default and Default Communications Device). 94 // 95 // On Windows systems which only support Wave Audio style default, uses either 96 // -1 or 0 to select the default device. 97 // 98 // On Windows systems which support both "Default Communication Device" and 99 // old Wave Audio style default, use -1 for Default Communications Device and 100 // -2 for Wave Audio style default, which is what we want to use for clips. 101 // It's not clear yet whether the -2 index is handled properly on other OSes. 102 103 #ifdef WIN32 104 static const int kDefaultAudioDeviceId = -1; 105 static const int kDefaultSoundclipDeviceId = -2; 106 #else 107 static const int kDefaultAudioDeviceId = 0; 108 #endif 109 110 // extension header for audio levels, as defined in 111 // http://tools.ietf.org/html/draft-ietf-avtext-client-to-mixer-audio-level-03 112 static const char kRtpAudioLevelHeaderExtension[] = 113 "urn:ietf:params:rtp-hdrext:ssrc-audio-level"; 114 static const int kRtpAudioLevelHeaderExtensionId = 1; 115 116 static const char kIsacCodecName[] = "ISAC"; 117 static const char kL16CodecName[] = "L16"; 118 // Codec parameters for Opus. 119 static const int kOpusMonoBitrate = 32000; 120 // Parameter used for NACK. 121 // This value is equivalent to 5 seconds of audio data at 20 ms per packet. 122 static const int kNackMaxPackets = 250; 123 static const int kOpusStereoBitrate = 64000; 124 // draft-spittka-payload-rtp-opus-03 125 // Opus bitrate should be in the range between 6000 and 510000. 126 static const int kOpusMinBitrate = 6000; 127 static const int kOpusMaxBitrate = 510000; 128 // Default audio dscp value. 129 // See http://tools.ietf.org/html/rfc2474 for details. 130 // See also http://tools.ietf.org/html/draft-jennings-rtcweb-qos-00 131 static const talk_base::DiffServCodePoint kAudioDscpValue = talk_base::DSCP_EF; 132 133 // Ensure we open the file in a writeable path on ChromeOS and Android. This 134 // workaround can be removed when it's possible to specify a filename for audio 135 // option based AEC dumps. 136 // 137 // TODO(grunell): Use a string in the options instead of hardcoding it here 138 // and let the embedder choose the filename (crbug.com/264223). 139 // 140 // NOTE(ajm): Don't use hardcoded paths on platforms not explicitly specified 141 // below. 142 #if defined(CHROMEOS) 143 static const char kAecDumpByAudioOptionFilename[] = "/tmp/audio.aecdump"; 144 #elif defined(ANDROID) 145 static const char kAecDumpByAudioOptionFilename[] = "/sdcard/audio.aecdump"; 146 #else 147 static const char kAecDumpByAudioOptionFilename[] = "audio.aecdump"; 148 #endif 149 150 // Dumps an AudioCodec in RFC 2327-ish format. 151 static std::string ToString(const AudioCodec& codec) { 152 std::stringstream ss; 153 ss << codec.name << "/" << codec.clockrate << "/" << codec.channels 154 << " (" << codec.id << ")"; 155 return ss.str(); 156 } 157 static std::string ToString(const webrtc::CodecInst& codec) { 158 std::stringstream ss; 159 ss << codec.plname << "/" << codec.plfreq << "/" << codec.channels 160 << " (" << codec.pltype << ")"; 161 return ss.str(); 162 } 163 164 static void LogMultiline(talk_base::LoggingSeverity sev, char* text) { 165 const char* delim = "\r\n"; 166 for (char* tok = strtok(text, delim); tok; tok = strtok(NULL, delim)) { 167 LOG_V(sev) << tok; 168 } 169 } 170 171 // Severity is an integer because it comes is assumed to be from command line. 172 static int SeverityToFilter(int severity) { 173 int filter = webrtc::kTraceNone; 174 switch (severity) { 175 case talk_base::LS_VERBOSE: 176 filter |= webrtc::kTraceAll; 177 case talk_base::LS_INFO: 178 filter |= (webrtc::kTraceStateInfo | webrtc::kTraceInfo); 179 case talk_base::LS_WARNING: 180 filter |= (webrtc::kTraceTerseInfo | webrtc::kTraceWarning); 181 case talk_base::LS_ERROR: 182 filter |= (webrtc::kTraceError | webrtc::kTraceCritical); 183 } 184 return filter; 185 } 186 187 static bool IsCodecMultiRate(const webrtc::CodecInst& codec) { 188 for (size_t i = 0; i < ARRAY_SIZE(kCodecPrefs); ++i) { 189 if (_stricmp(kCodecPrefs[i].name, codec.plname) == 0 && 190 kCodecPrefs[i].clockrate == codec.plfreq) { 191 return kCodecPrefs[i].is_multi_rate; 192 } 193 } 194 return false; 195 } 196 197 static bool FindCodec(const std::vector<AudioCodec>& codecs, 198 const AudioCodec& codec, 199 AudioCodec* found_codec) { 200 for (std::vector<AudioCodec>::const_iterator it = codecs.begin(); 201 it != codecs.end(); ++it) { 202 if (it->Matches(codec)) { 203 if (found_codec != NULL) { 204 *found_codec = *it; 205 } 206 return true; 207 } 208 } 209 return false; 210 } 211 212 static bool IsNackEnabled(const AudioCodec& codec) { 213 return codec.HasFeedbackParam(FeedbackParam(kRtcpFbParamNack, 214 kParamValueEmpty)); 215 } 216 217 // Gets the default set of options applied to the engine. Historically, these 218 // were supplied as a combination of flags from the channel manager (ec, agc, 219 // ns, and highpass) and the rest hardcoded in InitInternal. 220 static AudioOptions GetDefaultEngineOptions() { 221 AudioOptions options; 222 options.echo_cancellation.Set(true); 223 options.auto_gain_control.Set(true); 224 options.noise_suppression.Set(true); 225 options.highpass_filter.Set(true); 226 options.stereo_swapping.Set(false); 227 options.typing_detection.Set(true); 228 options.conference_mode.Set(false); 229 options.adjust_agc_delta.Set(0); 230 options.experimental_agc.Set(false); 231 options.experimental_aec.Set(false); 232 options.aec_dump.Set(false); 233 options.experimental_acm.Set(false); 234 return options; 235 } 236 237 class WebRtcSoundclipMedia : public SoundclipMedia { 238 public: 239 explicit WebRtcSoundclipMedia(WebRtcVoiceEngine *engine) 240 : engine_(engine), webrtc_channel_(-1) { 241 engine_->RegisterSoundclip(this); 242 } 243 244 virtual ~WebRtcSoundclipMedia() { 245 engine_->UnregisterSoundclip(this); 246 if (webrtc_channel_ != -1) { 247 // We shouldn't have to call Disable() here. DeleteChannel() should call 248 // StopPlayout() while deleting the channel. We should fix the bug 249 // inside WebRTC and remove the Disable() call bellow. This work is 250 // tracked by bug http://b/issue?id=5382855. 251 PlaySound(NULL, 0, 0); 252 Disable(); 253 if (engine_->voe_sc()->base()->DeleteChannel(webrtc_channel_) 254 == -1) { 255 LOG_RTCERR1(DeleteChannel, webrtc_channel_); 256 } 257 } 258 } 259 260 bool Init() { 261 if (!engine_->voe_sc()) { 262 return false; 263 } 264 webrtc_channel_ = engine_->CreateSoundclipVoiceChannel(); 265 if (webrtc_channel_ == -1) { 266 LOG_RTCERR0(CreateChannel); 267 return false; 268 } 269 return true; 270 } 271 272 bool Enable() { 273 if (engine_->voe_sc()->base()->StartPlayout(webrtc_channel_) == -1) { 274 LOG_RTCERR1(StartPlayout, webrtc_channel_); 275 return false; 276 } 277 return true; 278 } 279 280 bool Disable() { 281 if (engine_->voe_sc()->base()->StopPlayout(webrtc_channel_) == -1) { 282 LOG_RTCERR1(StopPlayout, webrtc_channel_); 283 return false; 284 } 285 return true; 286 } 287 288 virtual bool PlaySound(const char *buf, int len, int flags) { 289 // The voe file api is not available in chrome. 290 if (!engine_->voe_sc()->file()) { 291 return false; 292 } 293 // Must stop playing the current sound (if any), because we are about to 294 // modify the stream. 295 if (engine_->voe_sc()->file()->StopPlayingFileLocally(webrtc_channel_) 296 == -1) { 297 LOG_RTCERR1(StopPlayingFileLocally, webrtc_channel_); 298 return false; 299 } 300 301 if (buf) { 302 stream_.reset(new WebRtcSoundclipStream(buf, len)); 303 stream_->set_loop((flags & SF_LOOP) != 0); 304 stream_->Rewind(); 305 306 // Play it. 307 if (engine_->voe_sc()->file()->StartPlayingFileLocally( 308 webrtc_channel_, stream_.get()) == -1) { 309 LOG_RTCERR2(StartPlayingFileLocally, webrtc_channel_, stream_.get()); 310 LOG(LS_ERROR) << "Unable to start soundclip"; 311 return false; 312 } 313 } else { 314 stream_.reset(); 315 } 316 return true; 317 } 318 319 int GetLastEngineError() const { return engine_->voe_sc()->error(); } 320 321 private: 322 WebRtcVoiceEngine *engine_; 323 int webrtc_channel_; 324 talk_base::scoped_ptr<WebRtcSoundclipStream> stream_; 325 }; 326 327 WebRtcVoiceEngine::WebRtcVoiceEngine() 328 : voe_wrapper_(new VoEWrapper()), 329 voe_wrapper_sc_(new VoEWrapper()), 330 voe_wrapper_sc_initialized_(false), 331 tracing_(new VoETraceWrapper()), 332 adm_(NULL), 333 adm_sc_(NULL), 334 log_filter_(SeverityToFilter(kDefaultLogSeverity)), 335 is_dumping_aec_(false), 336 desired_local_monitor_enable_(false), 337 use_experimental_acm_(false), 338 tx_processor_ssrc_(0), 339 rx_processor_ssrc_(0) { 340 Construct(); 341 } 342 343 WebRtcVoiceEngine::WebRtcVoiceEngine(VoEWrapper* voe_wrapper, 344 VoEWrapper* voe_wrapper_sc, 345 VoETraceWrapper* tracing) 346 : voe_wrapper_(voe_wrapper), 347 voe_wrapper_sc_(voe_wrapper_sc), 348 voe_wrapper_sc_initialized_(false), 349 tracing_(tracing), 350 adm_(NULL), 351 adm_sc_(NULL), 352 log_filter_(SeverityToFilter(kDefaultLogSeverity)), 353 is_dumping_aec_(false), 354 desired_local_monitor_enable_(false), 355 use_experimental_acm_(false), 356 tx_processor_ssrc_(0), 357 rx_processor_ssrc_(0) { 358 Construct(); 359 } 360 361 void WebRtcVoiceEngine::Construct() { 362 SetTraceFilter(log_filter_); 363 initialized_ = false; 364 LOG(LS_VERBOSE) << "WebRtcVoiceEngine::WebRtcVoiceEngine"; 365 SetTraceOptions(""); 366 if (tracing_->SetTraceCallback(this) == -1) { 367 LOG_RTCERR0(SetTraceCallback); 368 } 369 if (voe_wrapper_->base()->RegisterVoiceEngineObserver(*this) == -1) { 370 LOG_RTCERR0(RegisterVoiceEngineObserver); 371 } 372 // Clear the default agc state. 373 memset(&default_agc_config_, 0, sizeof(default_agc_config_)); 374 375 // Load our audio codec list. 376 ConstructCodecs(); 377 378 // Load our RTP Header extensions. 379 rtp_header_extensions_.push_back( 380 RtpHeaderExtension(kRtpAudioLevelHeaderExtension, 381 kRtpAudioLevelHeaderExtensionId)); 382 options_ = GetDefaultEngineOptions(); 383 384 // Initialize the VoE Configuration to the default ACM. 385 voe_config_.Set<webrtc::AudioCodingModuleFactory>( 386 new webrtc::AudioCodingModuleFactory); 387 } 388 389 static bool IsOpus(const AudioCodec& codec) { 390 return (_stricmp(codec.name.c_str(), kOpusCodecName) == 0); 391 } 392 393 static bool IsIsac(const AudioCodec& codec) { 394 return (_stricmp(codec.name.c_str(), kIsacCodecName) == 0); 395 } 396 397 // True if params["stereo"] == "1" 398 static bool IsOpusStereoEnabled(const AudioCodec& codec) { 399 CodecParameterMap::const_iterator param = 400 codec.params.find(kCodecParamStereo); 401 if (param == codec.params.end()) { 402 return false; 403 } 404 return param->second == kParamValueTrue; 405 } 406 407 static bool IsValidOpusBitrate(int bitrate) { 408 return (bitrate >= kOpusMinBitrate && bitrate <= kOpusMaxBitrate); 409 } 410 411 // Returns 0 if params[kCodecParamMaxAverageBitrate] is not defined or invalid. 412 // Returns the value of params[kCodecParamMaxAverageBitrate] otherwise. 413 static int GetOpusBitrateFromParams(const AudioCodec& codec) { 414 int bitrate = 0; 415 if (!codec.GetParam(kCodecParamMaxAverageBitrate, &bitrate)) { 416 return 0; 417 } 418 if (!IsValidOpusBitrate(bitrate)) { 419 LOG(LS_WARNING) << "Codec parameter \"maxaveragebitrate\" has an " 420 << "invalid value: " << bitrate; 421 return 0; 422 } 423 return bitrate; 424 } 425 426 void WebRtcVoiceEngine::ConstructCodecs() { 427 LOG(LS_INFO) << "WebRtc VoiceEngine codecs:"; 428 int ncodecs = voe_wrapper_->codec()->NumOfCodecs(); 429 for (int i = 0; i < ncodecs; ++i) { 430 webrtc::CodecInst voe_codec; 431 if (voe_wrapper_->codec()->GetCodec(i, voe_codec) != -1) { 432 // Skip uncompressed formats. 433 if (_stricmp(voe_codec.plname, kL16CodecName) == 0) { 434 continue; 435 } 436 437 const CodecPref* pref = NULL; 438 for (size_t j = 0; j < ARRAY_SIZE(kCodecPrefs); ++j) { 439 if (_stricmp(kCodecPrefs[j].name, voe_codec.plname) == 0 && 440 kCodecPrefs[j].clockrate == voe_codec.plfreq && 441 kCodecPrefs[j].channels == voe_codec.channels) { 442 pref = &kCodecPrefs[j]; 443 break; 444 } 445 } 446 447 if (pref) { 448 // Use the payload type that we've configured in our pref table; 449 // use the offset in our pref table to determine the sort order. 450 AudioCodec codec(pref->payload_type, voe_codec.plname, voe_codec.plfreq, 451 voe_codec.rate, voe_codec.channels, 452 ARRAY_SIZE(kCodecPrefs) - (pref - kCodecPrefs)); 453 LOG(LS_INFO) << ToString(codec); 454 if (IsIsac(codec)) { 455 // Indicate auto-bandwidth in signaling. 456 codec.bitrate = 0; 457 } 458 if (IsOpus(codec)) { 459 // Only add fmtp parameters that differ from the spec. 460 if (kPreferredMinPTime != kOpusDefaultMinPTime) { 461 codec.params[kCodecParamMinPTime] = 462 talk_base::ToString(kPreferredMinPTime); 463 } 464 if (kPreferredMaxPTime != kOpusDefaultMaxPTime) { 465 codec.params[kCodecParamMaxPTime] = 466 talk_base::ToString(kPreferredMaxPTime); 467 } 468 // TODO(hellner): Add ptime, sprop-stereo, stereo and useinbandfec 469 // when they can be set to values other than the default. 470 } 471 codecs_.push_back(codec); 472 } else { 473 LOG(LS_WARNING) << "Unexpected codec: " << ToString(voe_codec); 474 } 475 } 476 } 477 // Make sure they are in local preference order. 478 std::sort(codecs_.begin(), codecs_.end(), &AudioCodec::Preferable); 479 } 480 481 WebRtcVoiceEngine::~WebRtcVoiceEngine() { 482 LOG(LS_VERBOSE) << "WebRtcVoiceEngine::~WebRtcVoiceEngine"; 483 if (voe_wrapper_->base()->DeRegisterVoiceEngineObserver() == -1) { 484 LOG_RTCERR0(DeRegisterVoiceEngineObserver); 485 } 486 if (adm_) { 487 voe_wrapper_.reset(); 488 adm_->Release(); 489 adm_ = NULL; 490 } 491 if (adm_sc_) { 492 voe_wrapper_sc_.reset(); 493 adm_sc_->Release(); 494 adm_sc_ = NULL; 495 } 496 497 // Test to see if the media processor was deregistered properly 498 ASSERT(SignalRxMediaFrame.is_empty()); 499 ASSERT(SignalTxMediaFrame.is_empty()); 500 501 tracing_->SetTraceCallback(NULL); 502 } 503 504 bool WebRtcVoiceEngine::Init(talk_base::Thread* worker_thread) { 505 LOG(LS_INFO) << "WebRtcVoiceEngine::Init"; 506 bool res = InitInternal(); 507 if (res) { 508 LOG(LS_INFO) << "WebRtcVoiceEngine::Init Done!"; 509 } else { 510 LOG(LS_ERROR) << "WebRtcVoiceEngine::Init failed"; 511 Terminate(); 512 } 513 return res; 514 } 515 516 bool WebRtcVoiceEngine::InitInternal() { 517 // Temporarily turn logging level up for the Init call 518 int old_filter = log_filter_; 519 int extended_filter = log_filter_ | SeverityToFilter(talk_base::LS_INFO); 520 SetTraceFilter(extended_filter); 521 SetTraceOptions(""); 522 523 // Init WebRtc VoiceEngine. 524 if (voe_wrapper_->base()->Init(adm_) == -1) { 525 LOG_RTCERR0_EX(Init, voe_wrapper_->error()); 526 SetTraceFilter(old_filter); 527 return false; 528 } 529 530 SetTraceFilter(old_filter); 531 SetTraceOptions(log_options_); 532 533 // Log the VoiceEngine version info 534 char buffer[1024] = ""; 535 voe_wrapper_->base()->GetVersion(buffer); 536 LOG(LS_INFO) << "WebRtc VoiceEngine Version:"; 537 LogMultiline(talk_base::LS_INFO, buffer); 538 539 // Save the default AGC configuration settings. This must happen before 540 // calling SetOptions or the default will be overwritten. 541 if (voe_wrapper_->processing()->GetAgcConfig(default_agc_config_) == -1) { 542 LOG_RTCERR0(GetAgcConfig); 543 return false; 544 } 545 546 // Set defaults for options, so that ApplyOptions applies them explicitly 547 // when we clear option (channel) overrides. External clients can still 548 // modify the defaults via SetOptions (on the media engine). 549 if (!SetOptions(GetDefaultEngineOptions())) { 550 return false; 551 } 552 553 // Print our codec list again for the call diagnostic log 554 LOG(LS_INFO) << "WebRtc VoiceEngine codecs:"; 555 for (std::vector<AudioCodec>::const_iterator it = codecs_.begin(); 556 it != codecs_.end(); ++it) { 557 LOG(LS_INFO) << ToString(*it); 558 } 559 560 // Disable the DTMF playout when a tone is sent. 561 // PlayDtmfTone will be used if local playout is needed. 562 if (voe_wrapper_->dtmf()->SetDtmfFeedbackStatus(false) == -1) { 563 LOG_RTCERR1(SetDtmfFeedbackStatus, false); 564 } 565 566 initialized_ = true; 567 return true; 568 } 569 570 bool WebRtcVoiceEngine::EnsureSoundclipEngineInit() { 571 if (voe_wrapper_sc_initialized_) { 572 return true; 573 } 574 // Note that, if initialization fails, voe_wrapper_sc_initialized_ will still 575 // be false, so subsequent calls to EnsureSoundclipEngineInit will 576 // probably just fail again. That's acceptable behavior. 577 #if defined(LINUX) && !defined(HAVE_LIBPULSE) 578 voe_wrapper_sc_->hw()->SetAudioDeviceLayer(webrtc::kAudioLinuxAlsa); 579 #endif 580 581 // Initialize the VoiceEngine instance that we'll use to play out sound clips. 582 if (voe_wrapper_sc_->base()->Init(adm_sc_) == -1) { 583 LOG_RTCERR0_EX(Init, voe_wrapper_sc_->error()); 584 return false; 585 } 586 587 // On Windows, tell it to use the default sound (not communication) devices. 588 // First check whether there is a valid sound device for playback. 589 // TODO(juberti): Clean this up when we support setting the soundclip device. 590 #ifdef WIN32 591 // The SetPlayoutDevice may not be implemented in the case of external ADM. 592 // TODO(ronghuawu): We should only check the adm_sc_ here, but current 593 // PeerConnection interface never set the adm_sc_, so need to check both 594 // in order to determine if the external adm is used. 595 if (!adm_ && !adm_sc_) { 596 int num_of_devices = 0; 597 if (voe_wrapper_sc_->hw()->GetNumOfPlayoutDevices(num_of_devices) != -1 && 598 num_of_devices > 0) { 599 if (voe_wrapper_sc_->hw()->SetPlayoutDevice(kDefaultSoundclipDeviceId) 600 == -1) { 601 LOG_RTCERR1_EX(SetPlayoutDevice, kDefaultSoundclipDeviceId, 602 voe_wrapper_sc_->error()); 603 return false; 604 } 605 } else { 606 LOG(LS_WARNING) << "No valid sound playout device found."; 607 } 608 } 609 #endif 610 voe_wrapper_sc_initialized_ = true; 611 LOG(LS_INFO) << "Initialized WebRtc soundclip engine."; 612 return true; 613 } 614 615 void WebRtcVoiceEngine::Terminate() { 616 LOG(LS_INFO) << "WebRtcVoiceEngine::Terminate"; 617 initialized_ = false; 618 619 StopAecDump(); 620 621 if (voe_wrapper_sc_) { 622 voe_wrapper_sc_initialized_ = false; 623 voe_wrapper_sc_->base()->Terminate(); 624 } 625 voe_wrapper_->base()->Terminate(); 626 desired_local_monitor_enable_ = false; 627 } 628 629 int WebRtcVoiceEngine::GetCapabilities() { 630 return AUDIO_SEND | AUDIO_RECV; 631 } 632 633 VoiceMediaChannel *WebRtcVoiceEngine::CreateChannel() { 634 WebRtcVoiceMediaChannel* ch = new WebRtcVoiceMediaChannel(this); 635 if (!ch->valid()) { 636 delete ch; 637 ch = NULL; 638 } 639 return ch; 640 } 641 642 SoundclipMedia *WebRtcVoiceEngine::CreateSoundclip() { 643 if (!EnsureSoundclipEngineInit()) { 644 LOG(LS_ERROR) << "Unable to create soundclip: soundclip engine failed to " 645 << "initialize."; 646 return NULL; 647 } 648 WebRtcSoundclipMedia *soundclip = new WebRtcSoundclipMedia(this); 649 if (!soundclip->Init() || !soundclip->Enable()) { 650 delete soundclip; 651 return NULL; 652 } 653 return soundclip; 654 } 655 656 bool WebRtcVoiceEngine::SetOptions(const AudioOptions& options) { 657 if (!ApplyOptions(options)) { 658 return false; 659 } 660 options_ = options; 661 return true; 662 } 663 664 bool WebRtcVoiceEngine::SetOptionOverrides(const AudioOptions& overrides) { 665 LOG(LS_INFO) << "Setting option overrides: " << overrides.ToString(); 666 if (!ApplyOptions(overrides)) { 667 return false; 668 } 669 option_overrides_ = overrides; 670 return true; 671 } 672 673 bool WebRtcVoiceEngine::ClearOptionOverrides() { 674 LOG(LS_INFO) << "Clearing option overrides."; 675 AudioOptions options = options_; 676 // Only call ApplyOptions if |options_overrides_| contains overrided options. 677 // ApplyOptions affects NS, AGC other options that is shared between 678 // all WebRtcVoiceEngineChannels. 679 if (option_overrides_ == AudioOptions()) { 680 return true; 681 } 682 683 if (!ApplyOptions(options)) { 684 return false; 685 } 686 option_overrides_ = AudioOptions(); 687 return true; 688 } 689 690 // AudioOptions defaults are set in InitInternal (for options with corresponding 691 // MediaEngineInterface flags) and in SetOptions(int) for flagless options. 692 bool WebRtcVoiceEngine::ApplyOptions(const AudioOptions& options_in) { 693 AudioOptions options = options_in; // The options are modified below. 694 // kEcConference is AEC with high suppression. 695 webrtc::EcModes ec_mode = webrtc::kEcConference; 696 webrtc::AecmModes aecm_mode = webrtc::kAecmSpeakerphone; 697 webrtc::AgcModes agc_mode = webrtc::kAgcAdaptiveAnalog; 698 webrtc::NsModes ns_mode = webrtc::kNsHighSuppression; 699 bool aecm_comfort_noise = false; 700 if (options.aecm_generate_comfort_noise.Get(&aecm_comfort_noise)) { 701 LOG(LS_VERBOSE) << "Comfort noise explicitly set to " 702 << aecm_comfort_noise << " (default is false)."; 703 } 704 705 #if defined(IOS) 706 // On iOS, VPIO provides built-in EC and AGC. 707 options.echo_cancellation.Set(false); 708 options.auto_gain_control.Set(false); 709 #elif defined(ANDROID) 710 ec_mode = webrtc::kEcAecm; 711 #endif 712 713 #if defined(IOS) || defined(ANDROID) 714 // Set the AGC mode for iOS as well despite disabling it above, to avoid 715 // unsupported configuration errors from webrtc. 716 agc_mode = webrtc::kAgcFixedDigital; 717 options.typing_detection.Set(false); 718 options.experimental_agc.Set(false); 719 options.experimental_aec.Set(false); 720 #endif 721 722 LOG(LS_INFO) << "Applying audio options: " << options.ToString(); 723 724 // Configure whether ACM1 or ACM2 is used. 725 bool enable_acm2 = false; 726 if (options.experimental_acm.Get(&enable_acm2)) { 727 EnableExperimentalAcm(enable_acm2); 728 } 729 730 webrtc::VoEAudioProcessing* voep = voe_wrapper_->processing(); 731 732 bool echo_cancellation; 733 if (options.echo_cancellation.Get(&echo_cancellation)) { 734 if (voep->SetEcStatus(echo_cancellation, ec_mode) == -1) { 735 LOG_RTCERR2(SetEcStatus, echo_cancellation, ec_mode); 736 return false; 737 } else { 738 LOG(LS_VERBOSE) << "Echo control set to " << echo_cancellation 739 << " with mode " << ec_mode; 740 } 741 #if !defined(ANDROID) 742 // TODO(ajm): Remove the error return on Android from webrtc. 743 if (voep->SetEcMetricsStatus(echo_cancellation) == -1) { 744 LOG_RTCERR1(SetEcMetricsStatus, echo_cancellation); 745 return false; 746 } 747 #endif 748 if (ec_mode == webrtc::kEcAecm) { 749 if (voep->SetAecmMode(aecm_mode, aecm_comfort_noise) != 0) { 750 LOG_RTCERR2(SetAecmMode, aecm_mode, aecm_comfort_noise); 751 return false; 752 } 753 } 754 } 755 756 bool auto_gain_control; 757 if (options.auto_gain_control.Get(&auto_gain_control)) { 758 if (voep->SetAgcStatus(auto_gain_control, agc_mode) == -1) { 759 LOG_RTCERR2(SetAgcStatus, auto_gain_control, agc_mode); 760 return false; 761 } else { 762 LOG(LS_VERBOSE) << "Auto gain set to " << auto_gain_control 763 << " with mode " << agc_mode; 764 } 765 } 766 767 if (options.tx_agc_target_dbov.IsSet() || 768 options.tx_agc_digital_compression_gain.IsSet() || 769 options.tx_agc_limiter.IsSet()) { 770 // Override default_agc_config_. Generally, an unset option means "leave 771 // the VoE bits alone" in this function, so we want whatever is set to be 772 // stored as the new "default". If we didn't, then setting e.g. 773 // tx_agc_target_dbov would reset digital compression gain and limiter 774 // settings. 775 // Also, if we don't update default_agc_config_, then adjust_agc_delta 776 // would be an offset from the original values, and not whatever was set 777 // explicitly. 778 default_agc_config_.targetLeveldBOv = 779 options.tx_agc_target_dbov.GetWithDefaultIfUnset( 780 default_agc_config_.targetLeveldBOv); 781 default_agc_config_.digitalCompressionGaindB = 782 options.tx_agc_digital_compression_gain.GetWithDefaultIfUnset( 783 default_agc_config_.digitalCompressionGaindB); 784 default_agc_config_.limiterEnable = 785 options.tx_agc_limiter.GetWithDefaultIfUnset( 786 default_agc_config_.limiterEnable); 787 if (voe_wrapper_->processing()->SetAgcConfig(default_agc_config_) == -1) { 788 LOG_RTCERR3(SetAgcConfig, 789 default_agc_config_.targetLeveldBOv, 790 default_agc_config_.digitalCompressionGaindB, 791 default_agc_config_.limiterEnable); 792 return false; 793 } 794 } 795 796 bool noise_suppression; 797 if (options.noise_suppression.Get(&noise_suppression)) { 798 if (voep->SetNsStatus(noise_suppression, ns_mode) == -1) { 799 LOG_RTCERR2(SetNsStatus, noise_suppression, ns_mode); 800 return false; 801 } else { 802 LOG(LS_VERBOSE) << "Noise suppression set to " << noise_suppression 803 << " with mode " << ns_mode; 804 } 805 } 806 807 bool highpass_filter; 808 if (options.highpass_filter.Get(&highpass_filter)) { 809 if (voep->EnableHighPassFilter(highpass_filter) == -1) { 810 LOG_RTCERR1(SetHighpassFilterStatus, highpass_filter); 811 return false; 812 } 813 } 814 815 bool stereo_swapping; 816 if (options.stereo_swapping.Get(&stereo_swapping)) { 817 voep->EnableStereoChannelSwapping(stereo_swapping); 818 if (voep->IsStereoChannelSwappingEnabled() != stereo_swapping) { 819 LOG_RTCERR1(EnableStereoChannelSwapping, stereo_swapping); 820 return false; 821 } 822 } 823 824 bool typing_detection; 825 if (options.typing_detection.Get(&typing_detection)) { 826 if (voep->SetTypingDetectionStatus(typing_detection) == -1) { 827 // In case of error, log the info and continue 828 LOG_RTCERR1(SetTypingDetectionStatus, typing_detection); 829 } 830 } 831 832 int adjust_agc_delta; 833 if (options.adjust_agc_delta.Get(&adjust_agc_delta)) { 834 if (!AdjustAgcLevel(adjust_agc_delta)) { 835 return false; 836 } 837 } 838 839 bool aec_dump; 840 if (options.aec_dump.Get(&aec_dump)) { 841 if (aec_dump) 842 StartAecDump(kAecDumpByAudioOptionFilename); 843 else 844 StopAecDump(); 845 } 846 847 bool experimental_aec; 848 if (options.experimental_aec.Get(&experimental_aec)) { 849 webrtc::AudioProcessing* audioproc = 850 voe_wrapper_->base()->audio_processing(); 851 // We check audioproc for the benefit of tests, since FakeWebRtcVoiceEngine 852 // returns NULL on audio_processing(). 853 if (audioproc) { 854 webrtc::Config config; 855 config.Set<webrtc::DelayCorrection>( 856 new webrtc::DelayCorrection(experimental_aec)); 857 audioproc->SetExtraOptions(config); 858 } 859 } 860 861 uint32 recording_sample_rate; 862 if (options.recording_sample_rate.Get(&recording_sample_rate)) { 863 if (voe_wrapper_->hw()->SetRecordingSampleRate(recording_sample_rate)) { 864 LOG_RTCERR1(SetRecordingSampleRate, recording_sample_rate); 865 } 866 } 867 868 uint32 playout_sample_rate; 869 if (options.playout_sample_rate.Get(&playout_sample_rate)) { 870 if (voe_wrapper_->hw()->SetPlayoutSampleRate(playout_sample_rate)) { 871 LOG_RTCERR1(SetPlayoutSampleRate, playout_sample_rate); 872 } 873 } 874 875 876 return true; 877 } 878 879 bool WebRtcVoiceEngine::SetDelayOffset(int offset) { 880 voe_wrapper_->processing()->SetDelayOffsetMs(offset); 881 if (voe_wrapper_->processing()->DelayOffsetMs() != offset) { 882 LOG_RTCERR1(SetDelayOffsetMs, offset); 883 return false; 884 } 885 886 return true; 887 } 888 889 struct ResumeEntry { 890 ResumeEntry(WebRtcVoiceMediaChannel *c, bool p, SendFlags s) 891 : channel(c), 892 playout(p), 893 send(s) { 894 } 895 896 WebRtcVoiceMediaChannel *channel; 897 bool playout; 898 SendFlags send; 899 }; 900 901 // TODO(juberti): Refactor this so that the core logic can be used to set the 902 // soundclip device. At that time, reinstate the soundclip pause/resume code. 903 bool WebRtcVoiceEngine::SetDevices(const Device* in_device, 904 const Device* out_device) { 905 #if !defined(IOS) 906 int in_id = in_device ? talk_base::FromString<int>(in_device->id) : 907 kDefaultAudioDeviceId; 908 int out_id = out_device ? talk_base::FromString<int>(out_device->id) : 909 kDefaultAudioDeviceId; 910 // The device manager uses -1 as the default device, which was the case for 911 // VoE 3.5. VoE 4.0, however, uses 0 as the default in Linux and Mac. 912 #ifndef WIN32 913 if (-1 == in_id) { 914 in_id = kDefaultAudioDeviceId; 915 } 916 if (-1 == out_id) { 917 out_id = kDefaultAudioDeviceId; 918 } 919 #endif 920 921 std::string in_name = (in_id != kDefaultAudioDeviceId) ? 922 in_device->name : "Default device"; 923 std::string out_name = (out_id != kDefaultAudioDeviceId) ? 924 out_device->name : "Default device"; 925 LOG(LS_INFO) << "Setting microphone to (id=" << in_id << ", name=" << in_name 926 << ") and speaker to (id=" << out_id << ", name=" << out_name 927 << ")"; 928 929 // If we're running the local monitor, we need to stop it first. 930 bool ret = true; 931 if (!PauseLocalMonitor()) { 932 LOG(LS_WARNING) << "Failed to pause local monitor"; 933 ret = false; 934 } 935 936 // Must also pause all audio playback and capture. 937 for (ChannelList::const_iterator i = channels_.begin(); 938 i != channels_.end(); ++i) { 939 WebRtcVoiceMediaChannel *channel = *i; 940 if (!channel->PausePlayout()) { 941 LOG(LS_WARNING) << "Failed to pause playout"; 942 ret = false; 943 } 944 if (!channel->PauseSend()) { 945 LOG(LS_WARNING) << "Failed to pause send"; 946 ret = false; 947 } 948 } 949 950 // Find the recording device id in VoiceEngine and set recording device. 951 if (!FindWebRtcAudioDeviceId(true, in_name, in_id, &in_id)) { 952 ret = false; 953 } 954 if (ret) { 955 if (voe_wrapper_->hw()->SetRecordingDevice(in_id) == -1) { 956 LOG_RTCERR2(SetRecordingDevice, in_name, in_id); 957 ret = false; 958 } 959 } 960 961 // Find the playout device id in VoiceEngine and set playout device. 962 if (!FindWebRtcAudioDeviceId(false, out_name, out_id, &out_id)) { 963 LOG(LS_WARNING) << "Failed to find VoiceEngine device id for " << out_name; 964 ret = false; 965 } 966 if (ret) { 967 if (voe_wrapper_->hw()->SetPlayoutDevice(out_id) == -1) { 968 LOG_RTCERR2(SetPlayoutDevice, out_name, out_id); 969 ret = false; 970 } 971 } 972 973 // Resume all audio playback and capture. 974 for (ChannelList::const_iterator i = channels_.begin(); 975 i != channels_.end(); ++i) { 976 WebRtcVoiceMediaChannel *channel = *i; 977 if (!channel->ResumePlayout()) { 978 LOG(LS_WARNING) << "Failed to resume playout"; 979 ret = false; 980 } 981 if (!channel->ResumeSend()) { 982 LOG(LS_WARNING) << "Failed to resume send"; 983 ret = false; 984 } 985 } 986 987 // Resume local monitor. 988 if (!ResumeLocalMonitor()) { 989 LOG(LS_WARNING) << "Failed to resume local monitor"; 990 ret = false; 991 } 992 993 if (ret) { 994 LOG(LS_INFO) << "Set microphone to (id=" << in_id <<" name=" << in_name 995 << ") and speaker to (id="<< out_id << " name=" << out_name 996 << ")"; 997 } 998 999 return ret; 1000 #else 1001 return true; 1002 #endif // !IOS 1003 } 1004 1005 bool WebRtcVoiceEngine::FindWebRtcAudioDeviceId( 1006 bool is_input, const std::string& dev_name, int dev_id, int* rtc_id) { 1007 // In Linux, VoiceEngine uses the same device dev_id as the device manager. 1008 #if defined(LINUX) || defined(ANDROID) 1009 *rtc_id = dev_id; 1010 return true; 1011 #else 1012 // In Windows and Mac, we need to find the VoiceEngine device id by name 1013 // unless the input dev_id is the default device id. 1014 if (kDefaultAudioDeviceId == dev_id) { 1015 *rtc_id = dev_id; 1016 return true; 1017 } 1018 1019 // Get the number of VoiceEngine audio devices. 1020 int count = 0; 1021 if (is_input) { 1022 if (-1 == voe_wrapper_->hw()->GetNumOfRecordingDevices(count)) { 1023 LOG_RTCERR0(GetNumOfRecordingDevices); 1024 return false; 1025 } 1026 } else { 1027 if (-1 == voe_wrapper_->hw()->GetNumOfPlayoutDevices(count)) { 1028 LOG_RTCERR0(GetNumOfPlayoutDevices); 1029 return false; 1030 } 1031 } 1032 1033 for (int i = 0; i < count; ++i) { 1034 char name[128]; 1035 char guid[128]; 1036 if (is_input) { 1037 voe_wrapper_->hw()->GetRecordingDeviceName(i, name, guid); 1038 LOG(LS_VERBOSE) << "VoiceEngine microphone " << i << ": " << name; 1039 } else { 1040 voe_wrapper_->hw()->GetPlayoutDeviceName(i, name, guid); 1041 LOG(LS_VERBOSE) << "VoiceEngine speaker " << i << ": " << name; 1042 } 1043 1044 std::string webrtc_name(name); 1045 if (dev_name.compare(0, webrtc_name.size(), webrtc_name) == 0) { 1046 *rtc_id = i; 1047 return true; 1048 } 1049 } 1050 LOG(LS_WARNING) << "VoiceEngine cannot find device: " << dev_name; 1051 return false; 1052 #endif 1053 } 1054 1055 bool WebRtcVoiceEngine::GetOutputVolume(int* level) { 1056 unsigned int ulevel; 1057 if (voe_wrapper_->volume()->GetSpeakerVolume(ulevel) == -1) { 1058 LOG_RTCERR1(GetSpeakerVolume, level); 1059 return false; 1060 } 1061 *level = ulevel; 1062 return true; 1063 } 1064 1065 bool WebRtcVoiceEngine::SetOutputVolume(int level) { 1066 ASSERT(level >= 0 && level <= 255); 1067 if (voe_wrapper_->volume()->SetSpeakerVolume(level) == -1) { 1068 LOG_RTCERR1(SetSpeakerVolume, level); 1069 return false; 1070 } 1071 return true; 1072 } 1073 1074 int WebRtcVoiceEngine::GetInputLevel() { 1075 unsigned int ulevel; 1076 return (voe_wrapper_->volume()->GetSpeechInputLevel(ulevel) != -1) ? 1077 static_cast<int>(ulevel) : -1; 1078 } 1079 1080 bool WebRtcVoiceEngine::SetLocalMonitor(bool enable) { 1081 desired_local_monitor_enable_ = enable; 1082 return ChangeLocalMonitor(desired_local_monitor_enable_); 1083 } 1084 1085 bool WebRtcVoiceEngine::ChangeLocalMonitor(bool enable) { 1086 // The voe file api is not available in chrome. 1087 if (!voe_wrapper_->file()) { 1088 return false; 1089 } 1090 if (enable && !monitor_) { 1091 monitor_.reset(new WebRtcMonitorStream); 1092 if (voe_wrapper_->file()->StartRecordingMicrophone(monitor_.get()) == -1) { 1093 LOG_RTCERR1(StartRecordingMicrophone, monitor_.get()); 1094 // Must call Stop() because there are some cases where Start will report 1095 // failure but still change the state, and if we leave VE in the on state 1096 // then it could crash later when trying to invoke methods on our monitor. 1097 voe_wrapper_->file()->StopRecordingMicrophone(); 1098 monitor_.reset(); 1099 return false; 1100 } 1101 } else if (!enable && monitor_) { 1102 voe_wrapper_->file()->StopRecordingMicrophone(); 1103 monitor_.reset(); 1104 } 1105 return true; 1106 } 1107 1108 bool WebRtcVoiceEngine::PauseLocalMonitor() { 1109 return ChangeLocalMonitor(false); 1110 } 1111 1112 bool WebRtcVoiceEngine::ResumeLocalMonitor() { 1113 return ChangeLocalMonitor(desired_local_monitor_enable_); 1114 } 1115 1116 const std::vector<AudioCodec>& WebRtcVoiceEngine::codecs() { 1117 return codecs_; 1118 } 1119 1120 bool WebRtcVoiceEngine::FindCodec(const AudioCodec& in) { 1121 return FindWebRtcCodec(in, NULL); 1122 } 1123 1124 // Get the VoiceEngine codec that matches |in|, with the supplied settings. 1125 bool WebRtcVoiceEngine::FindWebRtcCodec(const AudioCodec& in, 1126 webrtc::CodecInst* out) { 1127 int ncodecs = voe_wrapper_->codec()->NumOfCodecs(); 1128 for (int i = 0; i < ncodecs; ++i) { 1129 webrtc::CodecInst voe_codec; 1130 if (voe_wrapper_->codec()->GetCodec(i, voe_codec) != -1) { 1131 AudioCodec codec(voe_codec.pltype, voe_codec.plname, voe_codec.plfreq, 1132 voe_codec.rate, voe_codec.channels, 0); 1133 bool multi_rate = IsCodecMultiRate(voe_codec); 1134 // Allow arbitrary rates for ISAC to be specified. 1135 if (multi_rate) { 1136 // Set codec.bitrate to 0 so the check for codec.Matches() passes. 1137 codec.bitrate = 0; 1138 } 1139 if (codec.Matches(in)) { 1140 if (out) { 1141 // Fixup the payload type. 1142 voe_codec.pltype = in.id; 1143 1144 // Set bitrate if specified. 1145 if (multi_rate && in.bitrate != 0) { 1146 voe_codec.rate = in.bitrate; 1147 } 1148 1149 // Apply codec-specific settings. 1150 if (IsIsac(codec)) { 1151 // If ISAC and an explicit bitrate is not specified, 1152 // enable auto bandwidth adjustment. 1153 voe_codec.rate = (in.bitrate > 0) ? in.bitrate : -1; 1154 } 1155 *out = voe_codec; 1156 } 1157 return true; 1158 } 1159 } 1160 } 1161 return false; 1162 } 1163 const std::vector<RtpHeaderExtension>& 1164 WebRtcVoiceEngine::rtp_header_extensions() const { 1165 return rtp_header_extensions_; 1166 } 1167 1168 void WebRtcVoiceEngine::SetLogging(int min_sev, const char* filter) { 1169 // if min_sev == -1, we keep the current log level. 1170 if (min_sev >= 0) { 1171 SetTraceFilter(SeverityToFilter(min_sev)); 1172 } 1173 log_options_ = filter; 1174 SetTraceOptions(initialized_ ? log_options_ : ""); 1175 } 1176 1177 int WebRtcVoiceEngine::GetLastEngineError() { 1178 return voe_wrapper_->error(); 1179 } 1180 1181 void WebRtcVoiceEngine::SetTraceFilter(int filter) { 1182 log_filter_ = filter; 1183 tracing_->SetTraceFilter(filter); 1184 } 1185 1186 // We suppport three different logging settings for VoiceEngine: 1187 // 1. Observer callback that goes into talk diagnostic logfile. 1188 // Use --logfile and --loglevel 1189 // 1190 // 2. Encrypted VoiceEngine log for debugging VoiceEngine. 1191 // Use --voice_loglevel --voice_logfilter "tracefile file_name" 1192 // 1193 // 3. EC log and dump for debugging QualityEngine. 1194 // Use --voice_loglevel --voice_logfilter "recordEC file_name" 1195 // 1196 // For more details see: "https://sites.google.com/a/google.com/wavelet/Home/ 1197 // Magic-Flute--RTC-Engine-/Magic-Flute-Command-Line-Parameters" 1198 void WebRtcVoiceEngine::SetTraceOptions(const std::string& options) { 1199 // Set encrypted trace file. 1200 std::vector<std::string> opts; 1201 talk_base::tokenize(options, ' ', '"', '"', &opts); 1202 std::vector<std::string>::iterator tracefile = 1203 std::find(opts.begin(), opts.end(), "tracefile"); 1204 if (tracefile != opts.end() && ++tracefile != opts.end()) { 1205 // Write encrypted debug output (at same loglevel) to file 1206 // EncryptedTraceFile no longer supported. 1207 if (tracing_->SetTraceFile(tracefile->c_str()) == -1) { 1208 LOG_RTCERR1(SetTraceFile, *tracefile); 1209 } 1210 } 1211 1212 // Allow trace options to override the trace filter. We default 1213 // it to log_filter_ (as a translation of libjingle log levels) 1214 // elsewhere, but this allows clients to explicitly set webrtc 1215 // log levels. 1216 std::vector<std::string>::iterator tracefilter = 1217 std::find(opts.begin(), opts.end(), "tracefilter"); 1218 if (tracefilter != opts.end() && ++tracefilter != opts.end()) { 1219 if (!tracing_->SetTraceFilter(talk_base::FromString<int>(*tracefilter))) { 1220 LOG_RTCERR1(SetTraceFilter, *tracefilter); 1221 } 1222 } 1223 1224 // Set AEC dump file 1225 std::vector<std::string>::iterator recordEC = 1226 std::find(opts.begin(), opts.end(), "recordEC"); 1227 if (recordEC != opts.end()) { 1228 ++recordEC; 1229 if (recordEC != opts.end()) 1230 StartAecDump(recordEC->c_str()); 1231 else 1232 StopAecDump(); 1233 } 1234 } 1235 1236 // Ignore spammy trace messages, mostly from the stats API when we haven't 1237 // gotten RTCP info yet from the remote side. 1238 bool WebRtcVoiceEngine::ShouldIgnoreTrace(const std::string& trace) { 1239 static const char* kTracesToIgnore[] = { 1240 "\tfailed to GetReportBlockInformation", 1241 "GetRecCodec() failed to get received codec", 1242 "GetReceivedRtcpStatistics: Could not get received RTP statistics", 1243 "GetRemoteRTCPData() failed to measure statistics due to lack of received RTP and/or RTCP packets", // NOLINT 1244 "GetRemoteRTCPData() failed to retrieve sender info for remote side", 1245 "GetRTPStatistics() failed to measure RTT since no RTP packets have been received yet", // NOLINT 1246 "GetRTPStatistics() failed to read RTP statistics from the RTP/RTCP module", 1247 "GetRTPStatistics() failed to retrieve RTT from the RTP/RTCP module", 1248 "SenderInfoReceived No received SR", 1249 "StatisticsRTP() no statistics available", 1250 "TransmitMixer::TypingDetection() VE_TYPING_NOISE_WARNING message has been posted", // NOLINT 1251 "TransmitMixer::TypingDetection() pending noise-saturation warning exists", // NOLINT 1252 "GetRecPayloadType() failed to retrieve RX payload type (error=10026)", // NOLINT 1253 "StopPlayingFileAsMicrophone() isnot playing (error=8088)", 1254 NULL 1255 }; 1256 for (const char* const* p = kTracesToIgnore; *p; ++p) { 1257 if (trace.find(*p) != std::string::npos) { 1258 return true; 1259 } 1260 } 1261 return false; 1262 } 1263 1264 void WebRtcVoiceEngine::EnableExperimentalAcm(bool enable) { 1265 if (enable == use_experimental_acm_) 1266 return; 1267 if (enable) { 1268 LOG(LS_INFO) << "VoiceEngine is set to use new ACM (ACM2 + NetEq4)."; 1269 voe_config_.Set<webrtc::AudioCodingModuleFactory>( 1270 new webrtc::NewAudioCodingModuleFactory()); 1271 } else { 1272 LOG(LS_INFO) << "VoiceEngine is set to use legacy ACM (ACM1 + Neteq3)."; 1273 voe_config_.Set<webrtc::AudioCodingModuleFactory>( 1274 new webrtc::AudioCodingModuleFactory()); 1275 } 1276 use_experimental_acm_ = enable; 1277 } 1278 1279 void WebRtcVoiceEngine::Print(webrtc::TraceLevel level, const char* trace, 1280 int length) { 1281 talk_base::LoggingSeverity sev = talk_base::LS_VERBOSE; 1282 if (level == webrtc::kTraceError || level == webrtc::kTraceCritical) 1283 sev = talk_base::LS_ERROR; 1284 else if (level == webrtc::kTraceWarning) 1285 sev = talk_base::LS_WARNING; 1286 else if (level == webrtc::kTraceStateInfo || level == webrtc::kTraceInfo) 1287 sev = talk_base::LS_INFO; 1288 else if (level == webrtc::kTraceTerseInfo) 1289 sev = talk_base::LS_INFO; 1290 1291 // Skip past boilerplate prefix text 1292 if (length < 72) { 1293 std::string msg(trace, length); 1294 LOG(LS_ERROR) << "Malformed webrtc log message: "; 1295 LOG_V(sev) << msg; 1296 } else { 1297 std::string msg(trace + 71, length - 72); 1298 if (!ShouldIgnoreTrace(msg)) { 1299 LOG_V(sev) << "webrtc: " << msg; 1300 } 1301 } 1302 } 1303 1304 void WebRtcVoiceEngine::CallbackOnError(int channel_num, int err_code) { 1305 talk_base::CritScope lock(&channels_cs_); 1306 WebRtcVoiceMediaChannel* channel = NULL; 1307 uint32 ssrc = 0; 1308 LOG(LS_WARNING) << "VoiceEngine error " << err_code << " reported on channel " 1309 << channel_num << "."; 1310 if (FindChannelAndSsrc(channel_num, &channel, &ssrc)) { 1311 ASSERT(channel != NULL); 1312 channel->OnError(ssrc, err_code); 1313 } else { 1314 LOG(LS_ERROR) << "VoiceEngine channel " << channel_num 1315 << " could not be found in channel list when error reported."; 1316 } 1317 } 1318 1319 bool WebRtcVoiceEngine::FindChannelAndSsrc( 1320 int channel_num, WebRtcVoiceMediaChannel** channel, uint32* ssrc) const { 1321 ASSERT(channel != NULL && ssrc != NULL); 1322 1323 *channel = NULL; 1324 *ssrc = 0; 1325 // Find corresponding channel and ssrc 1326 for (ChannelList::const_iterator it = channels_.begin(); 1327 it != channels_.end(); ++it) { 1328 ASSERT(*it != NULL); 1329 if ((*it)->FindSsrc(channel_num, ssrc)) { 1330 *channel = *it; 1331 return true; 1332 } 1333 } 1334 1335 return false; 1336 } 1337 1338 // This method will search through the WebRtcVoiceMediaChannels and 1339 // obtain the voice engine's channel number. 1340 bool WebRtcVoiceEngine::FindChannelNumFromSsrc( 1341 uint32 ssrc, MediaProcessorDirection direction, int* channel_num) { 1342 ASSERT(channel_num != NULL); 1343 ASSERT(direction == MPD_RX || direction == MPD_TX); 1344 1345 *channel_num = -1; 1346 // Find corresponding channel for ssrc. 1347 for (ChannelList::const_iterator it = channels_.begin(); 1348 it != channels_.end(); ++it) { 1349 ASSERT(*it != NULL); 1350 if (direction & MPD_RX) { 1351 *channel_num = (*it)->GetReceiveChannelNum(ssrc); 1352 } 1353 if (*channel_num == -1 && (direction & MPD_TX)) { 1354 *channel_num = (*it)->GetSendChannelNum(ssrc); 1355 } 1356 if (*channel_num != -1) { 1357 return true; 1358 } 1359 } 1360 LOG(LS_WARNING) << "FindChannelFromSsrc. No Channel Found for Ssrc: " << ssrc; 1361 return false; 1362 } 1363 1364 void WebRtcVoiceEngine::RegisterChannel(WebRtcVoiceMediaChannel *channel) { 1365 talk_base::CritScope lock(&channels_cs_); 1366 channels_.push_back(channel); 1367 } 1368 1369 void WebRtcVoiceEngine::UnregisterChannel(WebRtcVoiceMediaChannel *channel) { 1370 talk_base::CritScope lock(&channels_cs_); 1371 ChannelList::iterator i = std::find(channels_.begin(), 1372 channels_.end(), 1373 channel); 1374 if (i != channels_.end()) { 1375 channels_.erase(i); 1376 } 1377 } 1378 1379 void WebRtcVoiceEngine::RegisterSoundclip(WebRtcSoundclipMedia *soundclip) { 1380 soundclips_.push_back(soundclip); 1381 } 1382 1383 void WebRtcVoiceEngine::UnregisterSoundclip(WebRtcSoundclipMedia *soundclip) { 1384 SoundclipList::iterator i = std::find(soundclips_.begin(), 1385 soundclips_.end(), 1386 soundclip); 1387 if (i != soundclips_.end()) { 1388 soundclips_.erase(i); 1389 } 1390 } 1391 1392 // Adjusts the default AGC target level by the specified delta. 1393 // NB: If we start messing with other config fields, we'll want 1394 // to save the current webrtc::AgcConfig as well. 1395 bool WebRtcVoiceEngine::AdjustAgcLevel(int delta) { 1396 webrtc::AgcConfig config = default_agc_config_; 1397 config.targetLeveldBOv -= delta; 1398 1399 LOG(LS_INFO) << "Adjusting AGC level from default -" 1400 << default_agc_config_.targetLeveldBOv << "dB to -" 1401 << config.targetLeveldBOv << "dB"; 1402 1403 if (voe_wrapper_->processing()->SetAgcConfig(config) == -1) { 1404 LOG_RTCERR1(SetAgcConfig, config.targetLeveldBOv); 1405 return false; 1406 } 1407 return true; 1408 } 1409 1410 bool WebRtcVoiceEngine::SetAudioDeviceModule(webrtc::AudioDeviceModule* adm, 1411 webrtc::AudioDeviceModule* adm_sc) { 1412 if (initialized_) { 1413 LOG(LS_WARNING) << "SetAudioDeviceModule can not be called after Init."; 1414 return false; 1415 } 1416 if (adm_) { 1417 adm_->Release(); 1418 adm_ = NULL; 1419 } 1420 if (adm) { 1421 adm_ = adm; 1422 adm_->AddRef(); 1423 } 1424 1425 if (adm_sc_) { 1426 adm_sc_->Release(); 1427 adm_sc_ = NULL; 1428 } 1429 if (adm_sc) { 1430 adm_sc_ = adm_sc; 1431 adm_sc_->AddRef(); 1432 } 1433 return true; 1434 } 1435 1436 bool WebRtcVoiceEngine::RegisterProcessor( 1437 uint32 ssrc, 1438 VoiceProcessor* voice_processor, 1439 MediaProcessorDirection direction) { 1440 bool register_with_webrtc = false; 1441 int channel_id = -1; 1442 bool success = false; 1443 uint32* processor_ssrc = NULL; 1444 bool found_channel = FindChannelNumFromSsrc(ssrc, direction, &channel_id); 1445 if (voice_processor == NULL || !found_channel) { 1446 LOG(LS_WARNING) << "Media Processing Registration Failed. ssrc: " << ssrc 1447 << " foundChannel: " << found_channel; 1448 return false; 1449 } 1450 1451 webrtc::ProcessingTypes processing_type; 1452 { 1453 talk_base::CritScope cs(&signal_media_critical_); 1454 if (direction == MPD_RX) { 1455 processing_type = webrtc::kPlaybackAllChannelsMixed; 1456 if (SignalRxMediaFrame.is_empty()) { 1457 register_with_webrtc = true; 1458 processor_ssrc = &rx_processor_ssrc_; 1459 } 1460 SignalRxMediaFrame.connect(voice_processor, 1461 &VoiceProcessor::OnFrame); 1462 } else { 1463 processing_type = webrtc::kRecordingPerChannel; 1464 if (SignalTxMediaFrame.is_empty()) { 1465 register_with_webrtc = true; 1466 processor_ssrc = &tx_processor_ssrc_; 1467 } 1468 SignalTxMediaFrame.connect(voice_processor, 1469 &VoiceProcessor::OnFrame); 1470 } 1471 } 1472 if (register_with_webrtc) { 1473 // TODO(janahan): when registering consider instantiating a 1474 // a VoeMediaProcess object and not make the engine extend the interface. 1475 if (voe()->media() && voe()->media()-> 1476 RegisterExternalMediaProcessing(channel_id, 1477 processing_type, 1478 *this) != -1) { 1479 LOG(LS_INFO) << "Media Processing Registration Succeeded. channel:" 1480 << channel_id; 1481 *processor_ssrc = ssrc; 1482 success = true; 1483 } else { 1484 LOG_RTCERR2(RegisterExternalMediaProcessing, 1485 channel_id, 1486 processing_type); 1487 success = false; 1488 } 1489 } else { 1490 // If we don't have to register with the engine, we just needed to 1491 // connect a new processor, set success to true; 1492 success = true; 1493 } 1494 return success; 1495 } 1496 1497 bool WebRtcVoiceEngine::UnregisterProcessorChannel( 1498 MediaProcessorDirection channel_direction, 1499 uint32 ssrc, 1500 VoiceProcessor* voice_processor, 1501 MediaProcessorDirection processor_direction) { 1502 bool success = true; 1503 FrameSignal* signal; 1504 webrtc::ProcessingTypes processing_type; 1505 uint32* processor_ssrc = NULL; 1506 if (channel_direction == MPD_RX) { 1507 signal = &SignalRxMediaFrame; 1508 processing_type = webrtc::kPlaybackAllChannelsMixed; 1509 processor_ssrc = &rx_processor_ssrc_; 1510 } else { 1511 signal = &SignalTxMediaFrame; 1512 processing_type = webrtc::kRecordingPerChannel; 1513 processor_ssrc = &tx_processor_ssrc_; 1514 } 1515 1516 int deregister_id = -1; 1517 { 1518 talk_base::CritScope cs(&signal_media_critical_); 1519 if ((processor_direction & channel_direction) != 0 && !signal->is_empty()) { 1520 signal->disconnect(voice_processor); 1521 int channel_id = -1; 1522 bool found_channel = FindChannelNumFromSsrc(ssrc, 1523 channel_direction, 1524 &channel_id); 1525 if (signal->is_empty() && found_channel) { 1526 deregister_id = channel_id; 1527 } 1528 } 1529 } 1530 if (deregister_id != -1) { 1531 if (voe()->media() && 1532 voe()->media()->DeRegisterExternalMediaProcessing(deregister_id, 1533 processing_type) != -1) { 1534 *processor_ssrc = 0; 1535 LOG(LS_INFO) << "Media Processing DeRegistration Succeeded. channel:" 1536 << deregister_id; 1537 } else { 1538 LOG_RTCERR2(DeRegisterExternalMediaProcessing, 1539 deregister_id, 1540 processing_type); 1541 success = false; 1542 } 1543 } 1544 return success; 1545 } 1546 1547 bool WebRtcVoiceEngine::UnregisterProcessor( 1548 uint32 ssrc, 1549 VoiceProcessor* voice_processor, 1550 MediaProcessorDirection direction) { 1551 bool success = true; 1552 if (voice_processor == NULL) { 1553 LOG(LS_WARNING) << "Media Processing Deregistration Failed. ssrc: " 1554 << ssrc; 1555 return false; 1556 } 1557 if (!UnregisterProcessorChannel(MPD_RX, ssrc, voice_processor, direction)) { 1558 success = false; 1559 } 1560 if (!UnregisterProcessorChannel(MPD_TX, ssrc, voice_processor, direction)) { 1561 success = false; 1562 } 1563 return success; 1564 } 1565 1566 // Implementing method from WebRtc VoEMediaProcess interface 1567 // Do not lock mux_channel_cs_ in this callback. 1568 void WebRtcVoiceEngine::Process(int channel, 1569 webrtc::ProcessingTypes type, 1570 int16_t audio10ms[], 1571 int length, 1572 int sampling_freq, 1573 bool is_stereo) { 1574 talk_base::CritScope cs(&signal_media_critical_); 1575 AudioFrame frame(audio10ms, length, sampling_freq, is_stereo); 1576 if (type == webrtc::kPlaybackAllChannelsMixed) { 1577 SignalRxMediaFrame(rx_processor_ssrc_, MPD_RX, &frame); 1578 } else if (type == webrtc::kRecordingPerChannel) { 1579 SignalTxMediaFrame(tx_processor_ssrc_, MPD_TX, &frame); 1580 } else { 1581 LOG(LS_WARNING) << "Media Processing invoked unexpectedly." 1582 << " channel: " << channel << " type: " << type 1583 << " tx_ssrc: " << tx_processor_ssrc_ 1584 << " rx_ssrc: " << rx_processor_ssrc_; 1585 } 1586 } 1587 1588 void WebRtcVoiceEngine::StartAecDump(const std::string& filename) { 1589 if (!is_dumping_aec_) { 1590 // Start dumping AEC when we are not dumping. 1591 if (voe_wrapper_->processing()->StartDebugRecording( 1592 filename.c_str()) != webrtc::AudioProcessing::kNoError) { 1593 LOG_RTCERR0(StartDebugRecording); 1594 } else { 1595 is_dumping_aec_ = true; 1596 } 1597 } 1598 } 1599 1600 void WebRtcVoiceEngine::StopAecDump() { 1601 if (is_dumping_aec_) { 1602 // Stop dumping AEC when we are dumping. 1603 if (voe_wrapper_->processing()->StopDebugRecording() != 1604 webrtc::AudioProcessing::kNoError) { 1605 LOG_RTCERR0(StopDebugRecording); 1606 } 1607 is_dumping_aec_ = false; 1608 } 1609 } 1610 1611 int WebRtcVoiceEngine::CreateVoiceChannel(VoEWrapper* voice_engine_wrapper) { 1612 return voice_engine_wrapper->base()->CreateChannel(voe_config_); 1613 } 1614 1615 int WebRtcVoiceEngine::CreateMediaVoiceChannel() { 1616 return CreateVoiceChannel(voe_wrapper_.get()); 1617 } 1618 1619 int WebRtcVoiceEngine::CreateSoundclipVoiceChannel() { 1620 return CreateVoiceChannel(voe_wrapper_sc_.get()); 1621 } 1622 1623 // This struct relies on the generated copy constructor and assignment operator 1624 // since it is used in an stl::map. 1625 struct WebRtcVoiceMediaChannel::WebRtcVoiceChannelInfo { 1626 WebRtcVoiceChannelInfo() : channel(-1), renderer(NULL) {} 1627 WebRtcVoiceChannelInfo(int ch, AudioRenderer* r) 1628 : channel(ch), 1629 renderer(r) {} 1630 ~WebRtcVoiceChannelInfo() {} 1631 1632 int channel; 1633 AudioRenderer* renderer; 1634 }; 1635 1636 // WebRtcVoiceMediaChannel 1637 WebRtcVoiceMediaChannel::WebRtcVoiceMediaChannel(WebRtcVoiceEngine *engine) 1638 : WebRtcMediaChannel<VoiceMediaChannel, WebRtcVoiceEngine>( 1639 engine, 1640 engine->CreateMediaVoiceChannel()), 1641 send_bw_setting_(false), 1642 send_autobw_(false), 1643 send_bw_bps_(0), 1644 options_(), 1645 dtmf_allowed_(false), 1646 desired_playout_(false), 1647 nack_enabled_(false), 1648 playout_(false), 1649 typing_noise_detected_(false), 1650 desired_send_(SEND_NOTHING), 1651 send_(SEND_NOTHING), 1652 default_receive_ssrc_(0) { 1653 engine->RegisterChannel(this); 1654 LOG(LS_VERBOSE) << "WebRtcVoiceMediaChannel::WebRtcVoiceMediaChannel " 1655 << voe_channel(); 1656 1657 ConfigureSendChannel(voe_channel()); 1658 } 1659 1660 WebRtcVoiceMediaChannel::~WebRtcVoiceMediaChannel() { 1661 LOG(LS_VERBOSE) << "WebRtcVoiceMediaChannel::~WebRtcVoiceMediaChannel " 1662 << voe_channel(); 1663 1664 // Remove any remaining send streams, the default channel will be deleted 1665 // later. 1666 while (!send_channels_.empty()) 1667 RemoveSendStream(send_channels_.begin()->first); 1668 1669 // Unregister ourselves from the engine. 1670 engine()->UnregisterChannel(this); 1671 // Remove any remaining streams. 1672 while (!receive_channels_.empty()) { 1673 RemoveRecvStream(receive_channels_.begin()->first); 1674 } 1675 1676 // Delete the default channel. 1677 DeleteChannel(voe_channel()); 1678 } 1679 1680 bool WebRtcVoiceMediaChannel::SetOptions(const AudioOptions& options) { 1681 LOG(LS_INFO) << "Setting voice channel options: " 1682 << options.ToString(); 1683 1684 // Check if DSCP value is changed from previous. 1685 bool dscp_option_changed = (options_.dscp != options.dscp); 1686 1687 // TODO(xians): Add support to set different options for different send 1688 // streams after we support multiple APMs. 1689 1690 // We retain all of the existing options, and apply the given ones 1691 // on top. This means there is no way to "clear" options such that 1692 // they go back to the engine default. 1693 options_.SetAll(options); 1694 1695 if (send_ != SEND_NOTHING) { 1696 if (!engine()->SetOptionOverrides(options_)) { 1697 LOG(LS_WARNING) << 1698 "Failed to engine SetOptionOverrides during channel SetOptions."; 1699 return false; 1700 } 1701 } else { 1702 // Will be interpreted when appropriate. 1703 } 1704 1705 // Receiver-side auto gain control happens per channel, so set it here from 1706 // options. Note that, like conference mode, setting it on the engine won't 1707 // have the desired effect, since voice channels don't inherit options from 1708 // the media engine when those options are applied per-channel. 1709 bool rx_auto_gain_control; 1710 if (options.rx_auto_gain_control.Get(&rx_auto_gain_control)) { 1711 if (engine()->voe()->processing()->SetRxAgcStatus( 1712 voe_channel(), rx_auto_gain_control, 1713 webrtc::kAgcFixedDigital) == -1) { 1714 LOG_RTCERR1(SetRxAgcStatus, rx_auto_gain_control); 1715 return false; 1716 } else { 1717 LOG(LS_VERBOSE) << "Rx auto gain set to " << rx_auto_gain_control 1718 << " with mode " << webrtc::kAgcFixedDigital; 1719 } 1720 } 1721 if (options.rx_agc_target_dbov.IsSet() || 1722 options.rx_agc_digital_compression_gain.IsSet() || 1723 options.rx_agc_limiter.IsSet()) { 1724 webrtc::AgcConfig config; 1725 // If only some of the options are being overridden, get the current 1726 // settings for the channel and bail if they aren't available. 1727 if (!options.rx_agc_target_dbov.IsSet() || 1728 !options.rx_agc_digital_compression_gain.IsSet() || 1729 !options.rx_agc_limiter.IsSet()) { 1730 if (engine()->voe()->processing()->GetRxAgcConfig( 1731 voe_channel(), config) != 0) { 1732 LOG(LS_ERROR) << "Failed to get default rx agc configuration for " 1733 << "channel " << voe_channel() << ". Since not all rx " 1734 << "agc options are specified, unable to safely set rx " 1735 << "agc options."; 1736 return false; 1737 } 1738 } 1739 config.targetLeveldBOv = 1740 options.rx_agc_target_dbov.GetWithDefaultIfUnset( 1741 config.targetLeveldBOv); 1742 config.digitalCompressionGaindB = 1743 options.rx_agc_digital_compression_gain.GetWithDefaultIfUnset( 1744 config.digitalCompressionGaindB); 1745 config.limiterEnable = options.rx_agc_limiter.GetWithDefaultIfUnset( 1746 config.limiterEnable); 1747 if (engine()->voe()->processing()->SetRxAgcConfig( 1748 voe_channel(), config) == -1) { 1749 LOG_RTCERR4(SetRxAgcConfig, voe_channel(), config.targetLeveldBOv, 1750 config.digitalCompressionGaindB, config.limiterEnable); 1751 return false; 1752 } 1753 } 1754 if (dscp_option_changed) { 1755 talk_base::DiffServCodePoint dscp = talk_base::DSCP_DEFAULT; 1756 if (options.dscp.GetWithDefaultIfUnset(false)) 1757 dscp = kAudioDscpValue; 1758 if (MediaChannel::SetDscp(dscp) != 0) { 1759 LOG(LS_WARNING) << "Failed to set DSCP settings for audio channel"; 1760 } 1761 } 1762 1763 LOG(LS_INFO) << "Set voice channel options. Current options: " 1764 << options_.ToString(); 1765 return true; 1766 } 1767 1768 bool WebRtcVoiceMediaChannel::SetRecvCodecs( 1769 const std::vector<AudioCodec>& codecs) { 1770 // Set the payload types to be used for incoming media. 1771 LOG(LS_INFO) << "Setting receive voice codecs:"; 1772 1773 std::vector<AudioCodec> new_codecs; 1774 // Find all new codecs. We allow adding new codecs but don't allow changing 1775 // the payload type of codecs that is already configured since we might 1776 // already be receiving packets with that payload type. 1777 for (std::vector<AudioCodec>::const_iterator it = codecs.begin(); 1778 it != codecs.end(); ++it) { 1779 AudioCodec old_codec; 1780 if (FindCodec(recv_codecs_, *it, &old_codec)) { 1781 if (old_codec.id != it->id) { 1782 LOG(LS_ERROR) << it->name << " payload type changed."; 1783 return false; 1784 } 1785 } else { 1786 new_codecs.push_back(*it); 1787 } 1788 } 1789 if (new_codecs.empty()) { 1790 // There are no new codecs to configure. Already configured codecs are 1791 // never removed. 1792 return true; 1793 } 1794 1795 if (playout_) { 1796 // Receive codecs can not be changed while playing. So we temporarily 1797 // pause playout. 1798 PausePlayout(); 1799 } 1800 1801 bool ret = true; 1802 for (std::vector<AudioCodec>::const_iterator it = new_codecs.begin(); 1803 it != new_codecs.end() && ret; ++it) { 1804 webrtc::CodecInst voe_codec; 1805 if (engine()->FindWebRtcCodec(*it, &voe_codec)) { 1806 LOG(LS_INFO) << ToString(*it); 1807 voe_codec.pltype = it->id; 1808 if (default_receive_ssrc_ == 0) { 1809 // Set the receive codecs on the default channel explicitly if the 1810 // default channel is not used by |receive_channels_|, this happens in 1811 // conference mode or in non-conference mode when there is no playout 1812 // channel. 1813 // TODO(xians): Figure out how we use the default channel in conference 1814 // mode. 1815 if (engine()->voe()->codec()->SetRecPayloadType( 1816 voe_channel(), voe_codec) == -1) { 1817 LOG_RTCERR2(SetRecPayloadType, voe_channel(), ToString(voe_codec)); 1818 ret = false; 1819 } 1820 } 1821 1822 // Set the receive codecs on all receiving channels. 1823 for (ChannelMap::iterator it = receive_channels_.begin(); 1824 it != receive_channels_.end() && ret; ++it) { 1825 if (engine()->voe()->codec()->SetRecPayloadType( 1826 it->second.channel, voe_codec) == -1) { 1827 LOG_RTCERR2(SetRecPayloadType, it->second.channel, 1828 ToString(voe_codec)); 1829 ret = false; 1830 } 1831 } 1832 } else { 1833 LOG(LS_WARNING) << "Unknown codec " << ToString(*it); 1834 ret = false; 1835 } 1836 } 1837 if (ret) { 1838 recv_codecs_ = codecs; 1839 } 1840 1841 if (desired_playout_ && !playout_) { 1842 ResumePlayout(); 1843 } 1844 return ret; 1845 } 1846 1847 bool WebRtcVoiceMediaChannel::SetSendCodecs( 1848 int channel, const std::vector<AudioCodec>& codecs) { 1849 // Disable VAD, and FEC unless we know the other side wants them. 1850 engine()->voe()->codec()->SetVADStatus(channel, false); 1851 engine()->voe()->rtp()->SetNACKStatus(channel, false, 0); 1852 engine()->voe()->rtp()->SetFECStatus(channel, false); 1853 1854 // Scan through the list to figure out the codec to use for sending, along 1855 // with the proper configuration for VAD and DTMF. 1856 bool first = true; 1857 webrtc::CodecInst send_codec; 1858 memset(&send_codec, 0, sizeof(send_codec)); 1859 1860 for (std::vector<AudioCodec>::const_iterator it = codecs.begin(); 1861 it != codecs.end(); ++it) { 1862 // Ignore codecs we don't know about. The negotiation step should prevent 1863 // this, but double-check to be sure. 1864 webrtc::CodecInst voe_codec; 1865 if (!engine()->FindWebRtcCodec(*it, &voe_codec)) { 1866 LOG(LS_WARNING) << "Unknown codec " << ToString(voe_codec); 1867 continue; 1868 } 1869 1870 // If OPUS, change what we send according to the "stereo" codec 1871 // parameter, and not the "channels" parameter. We set 1872 // voe_codec.channels to 2 if "stereo=1" and 1 otherwise. If 1873 // the bitrate is not specified, i.e. is zero, we set it to the 1874 // appropriate default value for mono or stereo Opus. 1875 if (IsOpus(*it)) { 1876 if (IsOpusStereoEnabled(*it)) { 1877 voe_codec.channels = 2; 1878 if (!IsValidOpusBitrate(it->bitrate)) { 1879 if (it->bitrate != 0) { 1880 LOG(LS_WARNING) << "Overrides the invalid supplied bitrate(" 1881 << it->bitrate 1882 << ") with default opus stereo bitrate: " 1883 << kOpusStereoBitrate; 1884 } 1885 voe_codec.rate = kOpusStereoBitrate; 1886 } 1887 } else { 1888 voe_codec.channels = 1; 1889 if (!IsValidOpusBitrate(it->bitrate)) { 1890 if (it->bitrate != 0) { 1891 LOG(LS_WARNING) << "Overrides the invalid supplied bitrate(" 1892 << it->bitrate 1893 << ") with default opus mono bitrate: " 1894 << kOpusMonoBitrate; 1895 } 1896 voe_codec.rate = kOpusMonoBitrate; 1897 } 1898 } 1899 int bitrate_from_params = GetOpusBitrateFromParams(*it); 1900 if (bitrate_from_params != 0) { 1901 voe_codec.rate = bitrate_from_params; 1902 } 1903 } 1904 1905 // Find the DTMF telephone event "codec" and tell VoiceEngine channels 1906 // about it. 1907 if (_stricmp(it->name.c_str(), "telephone-event") == 0 || 1908 _stricmp(it->name.c_str(), "audio/telephone-event") == 0) { 1909 if (engine()->voe()->dtmf()->SetSendTelephoneEventPayloadType( 1910 channel, it->id) == -1) { 1911 LOG_RTCERR2(SetSendTelephoneEventPayloadType, channel, it->id); 1912 return false; 1913 } 1914 } 1915 1916 // Turn voice activity detection/comfort noise on if supported. 1917 // Set the wideband CN payload type appropriately. 1918 // (narrowband always uses the static payload type 13). 1919 if (_stricmp(it->name.c_str(), "CN") == 0) { 1920 webrtc::PayloadFrequencies cn_freq; 1921 switch (it->clockrate) { 1922 case 8000: 1923 cn_freq = webrtc::kFreq8000Hz; 1924 break; 1925 case 16000: 1926 cn_freq = webrtc::kFreq16000Hz; 1927 break; 1928 case 32000: 1929 cn_freq = webrtc::kFreq32000Hz; 1930 break; 1931 default: 1932 LOG(LS_WARNING) << "CN frequency " << it->clockrate 1933 << " not supported."; 1934 continue; 1935 } 1936 // Set the CN payloadtype and the VAD status. 1937 // The CN payload type for 8000 Hz clockrate is fixed at 13. 1938 if (cn_freq != webrtc::kFreq8000Hz) { 1939 if (engine()->voe()->codec()->SetSendCNPayloadType( 1940 channel, it->id, cn_freq) == -1) { 1941 LOG_RTCERR3(SetSendCNPayloadType, channel, it->id, cn_freq); 1942 // TODO(ajm): This failure condition will be removed from VoE. 1943 // Restore the return here when we update to a new enough webrtc. 1944 // 1945 // Not returning false because the SetSendCNPayloadType will fail if 1946 // the channel is already sending. 1947 // This can happen if the remote description is applied twice, for 1948 // example in the case of ROAP on top of JSEP, where both side will 1949 // send the offer. 1950 } 1951 } 1952 1953 // Only turn on VAD if we have a CN payload type that matches the 1954 // clockrate for the codec we are going to use. 1955 if (it->clockrate == send_codec.plfreq) { 1956 LOG(LS_INFO) << "Enabling VAD"; 1957 if (engine()->voe()->codec()->SetVADStatus(channel, true) == -1) { 1958 LOG_RTCERR2(SetVADStatus, channel, true); 1959 return false; 1960 } 1961 } 1962 } 1963 1964 // We'll use the first codec in the list to actually send audio data. 1965 // Be sure to use the payload type requested by the remote side. 1966 // "red", for FEC audio, is a special case where the actual codec to be 1967 // used is specified in params. 1968 if (first) { 1969 if (_stricmp(it->name.c_str(), "red") == 0) { 1970 // Parse out the RED parameters. If we fail, just ignore RED; 1971 // we don't support all possible params/usage scenarios. 1972 if (!GetRedSendCodec(*it, codecs, &send_codec)) { 1973 continue; 1974 } 1975 1976 // Enable redundant encoding of the specified codec. Treat any 1977 // failure as a fatal internal error. 1978 LOG(LS_INFO) << "Enabling FEC"; 1979 if (engine()->voe()->rtp()->SetFECStatus(channel, true, it->id) == -1) { 1980 LOG_RTCERR3(SetFECStatus, channel, true, it->id); 1981 return false; 1982 } 1983 } else { 1984 send_codec = voe_codec; 1985 nack_enabled_ = IsNackEnabled(*it); 1986 SetNack(channel, nack_enabled_); 1987 } 1988 first = false; 1989 // Set the codec immediately, since SetVADStatus() depends on whether 1990 // the current codec is mono or stereo. 1991 if (!SetSendCodec(channel, send_codec)) 1992 return false; 1993 } 1994 } 1995 1996 // If we're being asked to set an empty list of codecs, due to a buggy client, 1997 // choose the most common format: PCMU 1998 if (first) { 1999 LOG(LS_WARNING) << "Received empty list of codecs; using PCMU/8000"; 2000 AudioCodec codec(0, "PCMU", 8000, 0, 1, 0); 2001 engine()->FindWebRtcCodec(codec, &send_codec); 2002 if (!SetSendCodec(channel, send_codec)) 2003 return false; 2004 } 2005 2006 // Always update the |send_codec_| to the currently set send codec. 2007 send_codec_.reset(new webrtc::CodecInst(send_codec)); 2008 2009 if (send_bw_setting_) { 2010 SetSendBandwidthInternal(send_autobw_, send_bw_bps_); 2011 } 2012 2013 return true; 2014 } 2015 2016 bool WebRtcVoiceMediaChannel::SetSendCodecs( 2017 const std::vector<AudioCodec>& codecs) { 2018 dtmf_allowed_ = false; 2019 for (std::vector<AudioCodec>::const_iterator it = codecs.begin(); 2020 it != codecs.end(); ++it) { 2021 // Find the DTMF telephone event "codec". 2022 if (_stricmp(it->name.c_str(), "telephone-event") == 0 || 2023 _stricmp(it->name.c_str(), "audio/telephone-event") == 0) { 2024 dtmf_allowed_ = true; 2025 } 2026 } 2027 2028 // Cache the codecs in order to configure the channel created later. 2029 send_codecs_ = codecs; 2030 for (ChannelMap::iterator iter = send_channels_.begin(); 2031 iter != send_channels_.end(); ++iter) { 2032 if (!SetSendCodecs(iter->second.channel, codecs)) { 2033 return false; 2034 } 2035 } 2036 2037 SetNack(receive_channels_, nack_enabled_); 2038 2039 return true; 2040 } 2041 2042 void WebRtcVoiceMediaChannel::SetNack(const ChannelMap& channels, 2043 bool nack_enabled) { 2044 for (ChannelMap::const_iterator it = channels.begin(); 2045 it != channels.end(); ++it) { 2046 SetNack(it->second.channel, nack_enabled); 2047 } 2048 } 2049 2050 void WebRtcVoiceMediaChannel::SetNack(int channel, bool nack_enabled) { 2051 if (nack_enabled) { 2052 LOG(LS_INFO) << "Enabling NACK for channel " << channel; 2053 engine()->voe()->rtp()->SetNACKStatus(channel, true, kNackMaxPackets); 2054 } else { 2055 LOG(LS_INFO) << "Disabling NACK for channel " << channel; 2056 engine()->voe()->rtp()->SetNACKStatus(channel, false, 0); 2057 } 2058 } 2059 2060 bool WebRtcVoiceMediaChannel::SetSendCodec( 2061 const webrtc::CodecInst& send_codec) { 2062 LOG(LS_INFO) << "Selected voice codec " << ToString(send_codec) 2063 << ", bitrate=" << send_codec.rate; 2064 for (ChannelMap::iterator iter = send_channels_.begin(); 2065 iter != send_channels_.end(); ++iter) { 2066 if (!SetSendCodec(iter->second.channel, send_codec)) 2067 return false; 2068 } 2069 2070 return true; 2071 } 2072 2073 bool WebRtcVoiceMediaChannel::SetSendCodec( 2074 int channel, const webrtc::CodecInst& send_codec) { 2075 LOG(LS_INFO) << "Send channel " << channel << " selected voice codec " 2076 << ToString(send_codec) << ", bitrate=" << send_codec.rate; 2077 2078 if (engine()->voe()->codec()->SetSendCodec(channel, send_codec) == -1) { 2079 LOG_RTCERR2(SetSendCodec, channel, ToString(send_codec)); 2080 return false; 2081 } 2082 return true; 2083 } 2084 2085 bool WebRtcVoiceMediaChannel::SetRecvRtpHeaderExtensions( 2086 const std::vector<RtpHeaderExtension>& extensions) { 2087 // We don't support any incoming extensions headers right now. 2088 return true; 2089 } 2090 2091 bool WebRtcVoiceMediaChannel::SetSendRtpHeaderExtensions( 2092 const std::vector<RtpHeaderExtension>& extensions) { 2093 // Enable the audio level extension header if requested. 2094 std::vector<RtpHeaderExtension>::const_iterator it; 2095 for (it = extensions.begin(); it != extensions.end(); ++it) { 2096 if (it->uri == kRtpAudioLevelHeaderExtension) { 2097 break; 2098 } 2099 } 2100 2101 bool enable = (it != extensions.end()); 2102 int id = 0; 2103 2104 if (enable) { 2105 id = it->id; 2106 if (id < kMinRtpHeaderExtensionId || 2107 id > kMaxRtpHeaderExtensionId) { 2108 LOG(LS_WARNING) << "Invalid RTP header extension id " << id; 2109 return false; 2110 } 2111 } 2112 2113 LOG(LS_INFO) << "Enabling audio level header extension with ID " << id; 2114 for (ChannelMap::const_iterator iter = send_channels_.begin(); 2115 iter != send_channels_.end(); ++iter) { 2116 if (engine()->voe()->rtp()->SetRTPAudioLevelIndicationStatus( 2117 iter->second.channel, enable, id) == -1) { 2118 LOG_RTCERR3(SetRTPAudioLevelIndicationStatus, 2119 iter->second.channel, enable, id); 2120 return false; 2121 } 2122 } 2123 2124 return true; 2125 } 2126 2127 bool WebRtcVoiceMediaChannel::SetPlayout(bool playout) { 2128 desired_playout_ = playout; 2129 return ChangePlayout(desired_playout_); 2130 } 2131 2132 bool WebRtcVoiceMediaChannel::PausePlayout() { 2133 return ChangePlayout(false); 2134 } 2135 2136 bool WebRtcVoiceMediaChannel::ResumePlayout() { 2137 return ChangePlayout(desired_playout_); 2138 } 2139 2140 bool WebRtcVoiceMediaChannel::ChangePlayout(bool playout) { 2141 if (playout_ == playout) { 2142 return true; 2143 } 2144 2145 // Change the playout of all channels to the new state. 2146 bool result = true; 2147 if (receive_channels_.empty()) { 2148 // Only toggle the default channel if we don't have any other channels. 2149 result = SetPlayout(voe_channel(), playout); 2150 } 2151 for (ChannelMap::iterator it = receive_channels_.begin(); 2152 it != receive_channels_.end() && result; ++it) { 2153 if (!SetPlayout(it->second.channel, playout)) { 2154 LOG(LS_ERROR) << "SetPlayout " << playout << " on channel " 2155 << it->second.channel << " failed"; 2156 result = false; 2157 } 2158 } 2159 2160 if (result) { 2161 playout_ = playout; 2162 } 2163 return result; 2164 } 2165 2166 bool WebRtcVoiceMediaChannel::SetSend(SendFlags send) { 2167 desired_send_ = send; 2168 if (!send_channels_.empty()) 2169 return ChangeSend(desired_send_); 2170 return true; 2171 } 2172 2173 bool WebRtcVoiceMediaChannel::PauseSend() { 2174 return ChangeSend(SEND_NOTHING); 2175 } 2176 2177 bool WebRtcVoiceMediaChannel::ResumeSend() { 2178 return ChangeSend(desired_send_); 2179 } 2180 2181 bool WebRtcVoiceMediaChannel::ChangeSend(SendFlags send) { 2182 if (send_ == send) { 2183 return true; 2184 } 2185 2186 // Change the settings on each send channel. 2187 if (send == SEND_MICROPHONE) 2188 engine()->SetOptionOverrides(options_); 2189 2190 // Change the settings on each send channel. 2191 for (ChannelMap::iterator iter = send_channels_.begin(); 2192 iter != send_channels_.end(); ++iter) { 2193 if (!ChangeSend(iter->second.channel, send)) 2194 return false; 2195 } 2196 2197 // Clear up the options after stopping sending. 2198 if (send == SEND_NOTHING) 2199 engine()->ClearOptionOverrides(); 2200 2201 send_ = send; 2202 return true; 2203 } 2204 2205 bool WebRtcVoiceMediaChannel::ChangeSend(int channel, SendFlags send) { 2206 if (send == SEND_MICROPHONE) { 2207 if (engine()->voe()->base()->StartSend(channel) == -1) { 2208 LOG_RTCERR1(StartSend, channel); 2209 return false; 2210 } 2211 if (engine()->voe()->file() && 2212 engine()->voe()->file()->StopPlayingFileAsMicrophone(channel) == -1) { 2213 LOG_RTCERR1(StopPlayingFileAsMicrophone, channel); 2214 return false; 2215 } 2216 } else { // SEND_NOTHING 2217 ASSERT(send == SEND_NOTHING); 2218 if (engine()->voe()->base()->StopSend(channel) == -1) { 2219 LOG_RTCERR1(StopSend, channel); 2220 return false; 2221 } 2222 } 2223 2224 return true; 2225 } 2226 2227 void WebRtcVoiceMediaChannel::ConfigureSendChannel(int channel) { 2228 if (engine()->voe()->network()->RegisterExternalTransport( 2229 channel, *this) == -1) { 2230 LOG_RTCERR2(RegisterExternalTransport, channel, this); 2231 } 2232 2233 // Enable RTCP (for quality stats and feedback messages) 2234 EnableRtcp(channel); 2235 2236 // Reset all recv codecs; they will be enabled via SetRecvCodecs. 2237 ResetRecvCodecs(channel); 2238 } 2239 2240 bool WebRtcVoiceMediaChannel::DeleteChannel(int channel) { 2241 if (engine()->voe()->network()->DeRegisterExternalTransport(channel) == -1) { 2242 LOG_RTCERR1(DeRegisterExternalTransport, channel); 2243 } 2244 2245 if (engine()->voe()->base()->DeleteChannel(channel) == -1) { 2246 LOG_RTCERR1(DeleteChannel, channel); 2247 return false; 2248 } 2249 2250 return true; 2251 } 2252 2253 bool WebRtcVoiceMediaChannel::AddSendStream(const StreamParams& sp) { 2254 // If the default channel is already used for sending create a new channel 2255 // otherwise use the default channel for sending. 2256 int channel = GetSendChannelNum(sp.first_ssrc()); 2257 if (channel != -1) { 2258 LOG(LS_ERROR) << "Stream already exists with ssrc " << sp.first_ssrc(); 2259 return false; 2260 } 2261 2262 bool default_channel_is_available = true; 2263 for (ChannelMap::const_iterator iter = send_channels_.begin(); 2264 iter != send_channels_.end(); ++iter) { 2265 if (IsDefaultChannel(iter->second.channel)) { 2266 default_channel_is_available = false; 2267 break; 2268 } 2269 } 2270 if (default_channel_is_available) { 2271 channel = voe_channel(); 2272 } else { 2273 // Create a new channel for sending audio data. 2274 channel = engine()->CreateMediaVoiceChannel(); 2275 if (channel == -1) { 2276 LOG_RTCERR0(CreateChannel); 2277 return false; 2278 } 2279 2280 ConfigureSendChannel(channel); 2281 } 2282 2283 // Save the channel to send_channels_, so that RemoveSendStream() can still 2284 // delete the channel in case failure happens below. 2285 send_channels_[sp.first_ssrc()] = WebRtcVoiceChannelInfo(channel, NULL); 2286 2287 // Set the send (local) SSRC. 2288 // If there are multiple send SSRCs, we can only set the first one here, and 2289 // the rest of the SSRC(s) need to be set after SetSendCodec has been called 2290 // (with a codec requires multiple SSRC(s)). 2291 if (engine()->voe()->rtp()->SetLocalSSRC(channel, sp.first_ssrc()) == -1) { 2292 LOG_RTCERR2(SetSendSSRC, channel, sp.first_ssrc()); 2293 return false; 2294 } 2295 2296 // At this point the channel's local SSRC has been updated. If the channel is 2297 // the default channel make sure that all the receive channels are updated as 2298 // well. Receive channels have to have the same SSRC as the default channel in 2299 // order to send receiver reports with this SSRC. 2300 if (IsDefaultChannel(channel)) { 2301 for (ChannelMap::const_iterator it = receive_channels_.begin(); 2302 it != receive_channels_.end(); ++it) { 2303 // Only update the SSRC for non-default channels. 2304 if (!IsDefaultChannel(it->second.channel)) { 2305 if (engine()->voe()->rtp()->SetLocalSSRC(it->second.channel, 2306 sp.first_ssrc()) != 0) { 2307 LOG_RTCERR2(SetLocalSSRC, it->second.channel, sp.first_ssrc()); 2308 return false; 2309 } 2310 } 2311 } 2312 } 2313 2314 if (engine()->voe()->rtp()->SetRTCP_CNAME(channel, sp.cname.c_str()) == -1) { 2315 LOG_RTCERR2(SetRTCP_CNAME, channel, sp.cname); 2316 return false; 2317 } 2318 2319 // Set the current codecs to be used for the new channel. 2320 if (!send_codecs_.empty() && !SetSendCodecs(channel, send_codecs_)) 2321 return false; 2322 2323 return ChangeSend(channel, desired_send_); 2324 } 2325 2326 bool WebRtcVoiceMediaChannel::RemoveSendStream(uint32 ssrc) { 2327 ChannelMap::iterator it = send_channels_.find(ssrc); 2328 if (it == send_channels_.end()) { 2329 LOG(LS_WARNING) << "Try to remove stream with ssrc " << ssrc 2330 << " which doesn't exist."; 2331 return false; 2332 } 2333 2334 int channel = it->second.channel; 2335 ChangeSend(channel, SEND_NOTHING); 2336 2337 // Notify the audio renderer that the send channel is going away. 2338 if (it->second.renderer) 2339 it->second.renderer->RemoveChannel(channel); 2340 2341 if (IsDefaultChannel(channel)) { 2342 // Do not delete the default channel since the receive channels depend on 2343 // the default channel, recycle it instead. 2344 ChangeSend(channel, SEND_NOTHING); 2345 } else { 2346 // Clean up and delete the send channel. 2347 LOG(LS_INFO) << "Removing audio send stream " << ssrc 2348 << " with VoiceEngine channel #" << channel << "."; 2349 if (!DeleteChannel(channel)) 2350 return false; 2351 } 2352 2353 send_channels_.erase(it); 2354 if (send_channels_.empty()) 2355 ChangeSend(SEND_NOTHING); 2356 2357 return true; 2358 } 2359 2360 bool WebRtcVoiceMediaChannel::AddRecvStream(const StreamParams& sp) { 2361 talk_base::CritScope lock(&receive_channels_cs_); 2362 2363 if (!VERIFY(sp.ssrcs.size() == 1)) 2364 return false; 2365 uint32 ssrc = sp.first_ssrc(); 2366 2367 if (ssrc == 0) { 2368 LOG(LS_WARNING) << "AddRecvStream with 0 ssrc is not supported."; 2369 return false; 2370 } 2371 2372 if (receive_channels_.find(ssrc) != receive_channels_.end()) { 2373 LOG(LS_ERROR) << "Stream already exists with ssrc " << ssrc; 2374 return false; 2375 } 2376 2377 // Reuse default channel for recv stream in non-conference mode call 2378 // when the default channel is not being used. 2379 if (!InConferenceMode() && default_receive_ssrc_ == 0) { 2380 LOG(LS_INFO) << "Recv stream " << sp.first_ssrc() 2381 << " reuse default channel"; 2382 default_receive_ssrc_ = sp.first_ssrc(); 2383 receive_channels_.insert(std::make_pair( 2384 default_receive_ssrc_, WebRtcVoiceChannelInfo(voe_channel(), NULL))); 2385 return SetPlayout(voe_channel(), playout_); 2386 } 2387 2388 // Create a new channel for receiving audio data. 2389 int channel = engine()->CreateMediaVoiceChannel(); 2390 if (channel == -1) { 2391 LOG_RTCERR0(CreateChannel); 2392 return false; 2393 } 2394 2395 if (!ConfigureRecvChannel(channel)) { 2396 DeleteChannel(channel); 2397 return false; 2398 } 2399 2400 receive_channels_.insert( 2401 std::make_pair(ssrc, WebRtcVoiceChannelInfo(channel, NULL))); 2402 2403 LOG(LS_INFO) << "New audio stream " << ssrc 2404 << " registered to VoiceEngine channel #" 2405 << channel << "."; 2406 return true; 2407 } 2408 2409 bool WebRtcVoiceMediaChannel::ConfigureRecvChannel(int channel) { 2410 // Configure to use external transport, like our default channel. 2411 if (engine()->voe()->network()->RegisterExternalTransport( 2412 channel, *this) == -1) { 2413 LOG_RTCERR2(SetExternalTransport, channel, this); 2414 return false; 2415 } 2416 2417 // Use the same SSRC as our default channel (so the RTCP reports are correct). 2418 unsigned int send_ssrc; 2419 webrtc::VoERTP_RTCP* rtp = engine()->voe()->rtp(); 2420 if (rtp->GetLocalSSRC(voe_channel(), send_ssrc) == -1) { 2421 LOG_RTCERR2(GetSendSSRC, channel, send_ssrc); 2422 return false; 2423 } 2424 if (rtp->SetLocalSSRC(channel, send_ssrc) == -1) { 2425 LOG_RTCERR2(SetSendSSRC, channel, send_ssrc); 2426 return false; 2427 } 2428 2429 // Use the same recv payload types as our default channel. 2430 ResetRecvCodecs(channel); 2431 if (!recv_codecs_.empty()) { 2432 for (std::vector<AudioCodec>::const_iterator it = recv_codecs_.begin(); 2433 it != recv_codecs_.end(); ++it) { 2434 webrtc::CodecInst voe_codec; 2435 if (engine()->FindWebRtcCodec(*it, &voe_codec)) { 2436 voe_codec.pltype = it->id; 2437 voe_codec.rate = 0; // Needed to make GetRecPayloadType work for ISAC 2438 if (engine()->voe()->codec()->GetRecPayloadType( 2439 voe_channel(), voe_codec) != -1) { 2440 if (engine()->voe()->codec()->SetRecPayloadType( 2441 channel, voe_codec) == -1) { 2442 LOG_RTCERR2(SetRecPayloadType, channel, ToString(voe_codec)); 2443 return false; 2444 } 2445 } 2446 } 2447 } 2448 } 2449 2450 if (InConferenceMode()) { 2451 // To be in par with the video, voe_channel() is not used for receiving in 2452 // a conference call. 2453 if (receive_channels_.empty() && default_receive_ssrc_ == 0 && playout_) { 2454 // This is the first stream in a multi user meeting. We can now 2455 // disable playback of the default stream. This since the default 2456 // stream will probably have received some initial packets before 2457 // the new stream was added. This will mean that the CN state from 2458 // the default channel will be mixed in with the other streams 2459 // throughout the whole meeting, which might be disturbing. 2460 LOG(LS_INFO) << "Disabling playback on the default voice channel"; 2461 SetPlayout(voe_channel(), false); 2462 } 2463 } 2464 SetNack(channel, nack_enabled_); 2465 2466 return SetPlayout(channel, playout_); 2467 } 2468 2469 bool WebRtcVoiceMediaChannel::RemoveRecvStream(uint32 ssrc) { 2470 talk_base::CritScope lock(&receive_channels_cs_); 2471 ChannelMap::iterator it = receive_channels_.find(ssrc); 2472 if (it == receive_channels_.end()) { 2473 LOG(LS_WARNING) << "Try to remove stream with ssrc " << ssrc 2474 << " which doesn't exist."; 2475 return false; 2476 } 2477 2478 if (ssrc == default_receive_ssrc_) { 2479 ASSERT(IsDefaultChannel(it->second.channel)); 2480 // Recycle the default channel is for recv stream. 2481 if (playout_) 2482 SetPlayout(voe_channel(), false); 2483 2484 if (it->second.renderer) 2485 it->second.renderer->RemoveChannel(voe_channel()); 2486 2487 default_receive_ssrc_ = 0; 2488 receive_channels_.erase(it); 2489 return true; 2490 } 2491 2492 // Non default channel. 2493 // Notify the renderer that channel is going away. 2494 if (it->second.renderer) 2495 it->second.renderer->RemoveChannel(it->second.channel); 2496 2497 LOG(LS_INFO) << "Removing audio stream " << ssrc 2498 << " with VoiceEngine channel #" << it->second.channel << "."; 2499 if (!DeleteChannel(it->second.channel)) { 2500 // Erase the entry anyhow. 2501 receive_channels_.erase(it); 2502 return false; 2503 } 2504 2505 receive_channels_.erase(it); 2506 bool enable_default_channel_playout = false; 2507 if (receive_channels_.empty()) { 2508 // The last stream was removed. We can now enable the default 2509 // channel for new channels to be played out immediately without 2510 // waiting for AddStream messages. 2511 // We do this for both conference mode and non-conference mode. 2512 // TODO(oja): Does the default channel still have it's CN state? 2513 enable_default_channel_playout = true; 2514 } 2515 if (!InConferenceMode() && receive_channels_.size() == 1 && 2516 default_receive_ssrc_ != 0) { 2517 // Only the default channel is active, enable the playout on default 2518 // channel. 2519 enable_default_channel_playout = true; 2520 } 2521 if (enable_default_channel_playout && playout_) { 2522 LOG(LS_INFO) << "Enabling playback on the default voice channel"; 2523 SetPlayout(voe_channel(), true); 2524 } 2525 2526 return true; 2527 } 2528 2529 bool WebRtcVoiceMediaChannel::SetRemoteRenderer(uint32 ssrc, 2530 AudioRenderer* renderer) { 2531 ChannelMap::iterator it = receive_channels_.find(ssrc); 2532 if (it == receive_channels_.end()) { 2533 if (renderer) { 2534 // Return an error if trying to set a valid renderer with an invalid ssrc. 2535 LOG(LS_ERROR) << "SetRemoteRenderer failed with ssrc "<< ssrc; 2536 return false; 2537 } 2538 2539 // The channel likely has gone away, do nothing. 2540 return true; 2541 } 2542 2543 AudioRenderer* remote_renderer = it->second.renderer; 2544 if (renderer) { 2545 ASSERT(remote_renderer == NULL || remote_renderer == renderer); 2546 if (!remote_renderer) { 2547 renderer->AddChannel(it->second.channel); 2548 } 2549 } else if (remote_renderer) { 2550 // |renderer| == NULL, remove the channel from the renderer. 2551 remote_renderer->RemoveChannel(it->second.channel); 2552 } 2553 2554 // Assign the new value to the struct. 2555 it->second.renderer = renderer; 2556 return true; 2557 } 2558 2559 bool WebRtcVoiceMediaChannel::SetLocalRenderer(uint32 ssrc, 2560 AudioRenderer* renderer) { 2561 ChannelMap::iterator it = send_channels_.find(ssrc); 2562 if (it == send_channels_.end()) { 2563 if (renderer) { 2564 // Return an error if trying to set a valid renderer with an invalid ssrc. 2565 LOG(LS_ERROR) << "SetLocalRenderer failed with ssrc "<< ssrc; 2566 return false; 2567 } 2568 2569 // The channel likely has gone away, do nothing. 2570 return true; 2571 } 2572 2573 AudioRenderer* local_renderer = it->second.renderer; 2574 if (renderer) { 2575 ASSERT(local_renderer == NULL || local_renderer == renderer); 2576 if (!local_renderer) 2577 renderer->AddChannel(it->second.channel); 2578 } else if (local_renderer) { 2579 local_renderer->RemoveChannel(it->second.channel); 2580 } 2581 2582 // Assign the new value to the struct. 2583 it->second.renderer = renderer; 2584 return true; 2585 } 2586 2587 bool WebRtcVoiceMediaChannel::GetActiveStreams( 2588 AudioInfo::StreamList* actives) { 2589 // In conference mode, the default channel should not be in 2590 // |receive_channels_|. 2591 actives->clear(); 2592 for (ChannelMap::iterator it = receive_channels_.begin(); 2593 it != receive_channels_.end(); ++it) { 2594 int level = GetOutputLevel(it->second.channel); 2595 if (level > 0) { 2596 actives->push_back(std::make_pair(it->first, level)); 2597 } 2598 } 2599 return true; 2600 } 2601 2602 int WebRtcVoiceMediaChannel::GetOutputLevel() { 2603 // return the highest output level of all streams 2604 int highest = GetOutputLevel(voe_channel()); 2605 for (ChannelMap::iterator it = receive_channels_.begin(); 2606 it != receive_channels_.end(); ++it) { 2607 int level = GetOutputLevel(it->second.channel); 2608 highest = talk_base::_max(level, highest); 2609 } 2610 return highest; 2611 } 2612 2613 int WebRtcVoiceMediaChannel::GetTimeSinceLastTyping() { 2614 int ret; 2615 if (engine()->voe()->processing()->TimeSinceLastTyping(ret) == -1) { 2616 // In case of error, log the info and continue 2617 LOG_RTCERR0(TimeSinceLastTyping); 2618 ret = -1; 2619 } else { 2620 ret *= 1000; // We return ms, webrtc returns seconds. 2621 } 2622 return ret; 2623 } 2624 2625 void WebRtcVoiceMediaChannel::SetTypingDetectionParameters(int time_window, 2626 int cost_per_typing, int reporting_threshold, int penalty_decay, 2627 int type_event_delay) { 2628 if (engine()->voe()->processing()->SetTypingDetectionParameters( 2629 time_window, cost_per_typing, 2630 reporting_threshold, penalty_decay, type_event_delay) == -1) { 2631 // In case of error, log the info and continue 2632 LOG_RTCERR5(SetTypingDetectionParameters, time_window, 2633 cost_per_typing, reporting_threshold, penalty_decay, 2634 type_event_delay); 2635 } 2636 } 2637 2638 bool WebRtcVoiceMediaChannel::SetOutputScaling( 2639 uint32 ssrc, double left, double right) { 2640 talk_base::CritScope lock(&receive_channels_cs_); 2641 // Collect the channels to scale the output volume. 2642 std::vector<int> channels; 2643 if (0 == ssrc) { // Collect all channels, including the default one. 2644 // Default channel is not in receive_channels_ if it is not being used for 2645 // playout. 2646 if (default_receive_ssrc_ == 0) 2647 channels.push_back(voe_channel()); 2648 for (ChannelMap::const_iterator it = receive_channels_.begin(); 2649 it != receive_channels_.end(); ++it) { 2650 channels.push_back(it->second.channel); 2651 } 2652 } else { // Collect only the channel of the specified ssrc. 2653 int channel = GetReceiveChannelNum(ssrc); 2654 if (-1 == channel) { 2655 LOG(LS_WARNING) << "Cannot find channel for ssrc:" << ssrc; 2656 return false; 2657 } 2658 channels.push_back(channel); 2659 } 2660 2661 // Scale the output volume for the collected channels. We first normalize to 2662 // scale the volume and then set the left and right pan. 2663 float scale = static_cast<float>(talk_base::_max(left, right)); 2664 if (scale > 0.0001f) { 2665 left /= scale; 2666 right /= scale; 2667 } 2668 for (std::vector<int>::const_iterator it = channels.begin(); 2669 it != channels.end(); ++it) { 2670 if (-1 == engine()->voe()->volume()->SetChannelOutputVolumeScaling( 2671 *it, scale)) { 2672 LOG_RTCERR2(SetChannelOutputVolumeScaling, *it, scale); 2673 return false; 2674 } 2675 if (-1 == engine()->voe()->volume()->SetOutputVolumePan( 2676 *it, static_cast<float>(left), static_cast<float>(right))) { 2677 LOG_RTCERR3(SetOutputVolumePan, *it, left, right); 2678 // Do not return if fails. SetOutputVolumePan is not available for all 2679 // pltforms. 2680 } 2681 LOG(LS_INFO) << "SetOutputScaling to left=" << left * scale 2682 << " right=" << right * scale 2683 << " for channel " << *it << " and ssrc " << ssrc; 2684 } 2685 return true; 2686 } 2687 2688 bool WebRtcVoiceMediaChannel::GetOutputScaling( 2689 uint32 ssrc, double* left, double* right) { 2690 if (!left || !right) return false; 2691 2692 talk_base::CritScope lock(&receive_channels_cs_); 2693 // Determine which channel based on ssrc. 2694 int channel = (0 == ssrc) ? voe_channel() : GetReceiveChannelNum(ssrc); 2695 if (channel == -1) { 2696 LOG(LS_WARNING) << "Cannot find channel for ssrc:" << ssrc; 2697 return false; 2698 } 2699 2700 float scaling; 2701 if (-1 == engine()->voe()->volume()->GetChannelOutputVolumeScaling( 2702 channel, scaling)) { 2703 LOG_RTCERR2(GetChannelOutputVolumeScaling, channel, scaling); 2704 return false; 2705 } 2706 2707 float left_pan; 2708 float right_pan; 2709 if (-1 == engine()->voe()->volume()->GetOutputVolumePan( 2710 channel, left_pan, right_pan)) { 2711 LOG_RTCERR3(GetOutputVolumePan, channel, left_pan, right_pan); 2712 // If GetOutputVolumePan fails, we use the default left and right pan. 2713 left_pan = 1.0f; 2714 right_pan = 1.0f; 2715 } 2716 2717 *left = scaling * left_pan; 2718 *right = scaling * right_pan; 2719 return true; 2720 } 2721 2722 bool WebRtcVoiceMediaChannel::SetRingbackTone(const char *buf, int len) { 2723 ringback_tone_.reset(new WebRtcSoundclipStream(buf, len)); 2724 return true; 2725 } 2726 2727 bool WebRtcVoiceMediaChannel::PlayRingbackTone(uint32 ssrc, 2728 bool play, bool loop) { 2729 if (!ringback_tone_) { 2730 return false; 2731 } 2732 2733 // The voe file api is not available in chrome. 2734 if (!engine()->voe()->file()) { 2735 return false; 2736 } 2737 2738 // Determine which VoiceEngine channel to play on. 2739 int channel = (ssrc == 0) ? voe_channel() : GetReceiveChannelNum(ssrc); 2740 if (channel == -1) { 2741 return false; 2742 } 2743 2744 // Make sure the ringtone is cued properly, and play it out. 2745 if (play) { 2746 ringback_tone_->set_loop(loop); 2747 ringback_tone_->Rewind(); 2748 if (engine()->voe()->file()->StartPlayingFileLocally(channel, 2749 ringback_tone_.get()) == -1) { 2750 LOG_RTCERR2(StartPlayingFileLocally, channel, ringback_tone_.get()); 2751 LOG(LS_ERROR) << "Unable to start ringback tone"; 2752 return false; 2753 } 2754 ringback_channels_.insert(channel); 2755 LOG(LS_INFO) << "Started ringback on channel " << channel; 2756 } else { 2757 if (engine()->voe()->file()->IsPlayingFileLocally(channel) == 1 && 2758 engine()->voe()->file()->StopPlayingFileLocally(channel) == -1) { 2759 LOG_RTCERR1(StopPlayingFileLocally, channel); 2760 return false; 2761 } 2762 LOG(LS_INFO) << "Stopped ringback on channel " << channel; 2763 ringback_channels_.erase(channel); 2764 } 2765 2766 return true; 2767 } 2768 2769 bool WebRtcVoiceMediaChannel::CanInsertDtmf() { 2770 return dtmf_allowed_; 2771 } 2772 2773 bool WebRtcVoiceMediaChannel::InsertDtmf(uint32 ssrc, int event, 2774 int duration, int flags) { 2775 if (!dtmf_allowed_) { 2776 return false; 2777 } 2778 2779 // Send the event. 2780 if (flags & cricket::DF_SEND) { 2781 int channel = -1; 2782 if (ssrc == 0) { 2783 bool default_channel_is_inuse = false; 2784 for (ChannelMap::const_iterator iter = send_channels_.begin(); 2785 iter != send_channels_.end(); ++iter) { 2786 if (IsDefaultChannel(iter->second.channel)) { 2787 default_channel_is_inuse = true; 2788 break; 2789 } 2790 } 2791 if (default_channel_is_inuse) { 2792 channel = voe_channel(); 2793 } else if (!send_channels_.empty()) { 2794 channel = send_channels_.begin()->second.channel; 2795 } 2796 } else { 2797 channel = GetSendChannelNum(ssrc); 2798 } 2799 if (channel == -1) { 2800 LOG(LS_WARNING) << "InsertDtmf - The specified ssrc " 2801 << ssrc << " is not in use."; 2802 return false; 2803 } 2804 // Send DTMF using out-of-band DTMF. ("true", as 3rd arg) 2805 if (engine()->voe()->dtmf()->SendTelephoneEvent( 2806 channel, event, true, duration) == -1) { 2807 LOG_RTCERR4(SendTelephoneEvent, channel, event, true, duration); 2808 return false; 2809 } 2810 } 2811 2812 // Play the event. 2813 if (flags & cricket::DF_PLAY) { 2814 // Play DTMF tone locally. 2815 if (engine()->voe()->dtmf()->PlayDtmfTone(event, duration) == -1) { 2816 LOG_RTCERR2(PlayDtmfTone, event, duration); 2817 return false; 2818 } 2819 } 2820 2821 return true; 2822 } 2823 2824 void WebRtcVoiceMediaChannel::OnPacketReceived( 2825 talk_base::Buffer* packet, const talk_base::PacketTime& packet_time) { 2826 // Pick which channel to send this packet to. If this packet doesn't match 2827 // any multiplexed streams, just send it to the default channel. Otherwise, 2828 // send it to the specific decoder instance for that stream. 2829 int which_channel = GetReceiveChannelNum( 2830 ParseSsrc(packet->data(), packet->length(), false)); 2831 if (which_channel == -1) { 2832 which_channel = voe_channel(); 2833 } 2834 2835 // Stop any ringback that might be playing on the channel. 2836 // It's possible the ringback has already stopped, ih which case we'll just 2837 // use the opportunity to remove the channel from ringback_channels_. 2838 if (engine()->voe()->file()) { 2839 const std::set<int>::iterator it = ringback_channels_.find(which_channel); 2840 if (it != ringback_channels_.end()) { 2841 if (engine()->voe()->file()->IsPlayingFileLocally( 2842 which_channel) == 1) { 2843 engine()->voe()->file()->StopPlayingFileLocally(which_channel); 2844 LOG(LS_INFO) << "Stopped ringback on channel " << which_channel 2845 << " due to incoming media"; 2846 } 2847 ringback_channels_.erase(which_channel); 2848 } 2849 } 2850 2851 // Pass it off to the decoder. 2852 engine()->voe()->network()->ReceivedRTPPacket( 2853 which_channel, 2854 packet->data(), 2855 static_cast<unsigned int>(packet->length())); 2856 } 2857 2858 void WebRtcVoiceMediaChannel::OnRtcpReceived( 2859 talk_base::Buffer* packet, const talk_base::PacketTime& packet_time) { 2860 // Sending channels need all RTCP packets with feedback information. 2861 // Even sender reports can contain attached report blocks. 2862 // Receiving channels need sender reports in order to create 2863 // correct receiver reports. 2864 int type = 0; 2865 if (!GetRtcpType(packet->data(), packet->length(), &type)) { 2866 LOG(LS_WARNING) << "Failed to parse type from received RTCP packet"; 2867 return; 2868 } 2869 2870 // If it is a sender report, find the channel that is listening. 2871 bool has_sent_to_default_channel = false; 2872 if (type == kRtcpTypeSR) { 2873 int which_channel = GetReceiveChannelNum( 2874 ParseSsrc(packet->data(), packet->length(), true)); 2875 if (which_channel != -1) { 2876 engine()->voe()->network()->ReceivedRTCPPacket( 2877 which_channel, 2878 packet->data(), 2879 static_cast<unsigned int>(packet->length())); 2880 2881 if (IsDefaultChannel(which_channel)) 2882 has_sent_to_default_channel = true; 2883 } 2884 } 2885 2886 // SR may continue RR and any RR entry may correspond to any one of the send 2887 // channels. So all RTCP packets must be forwarded all send channels. VoE 2888 // will filter out RR internally. 2889 for (ChannelMap::iterator iter = send_channels_.begin(); 2890 iter != send_channels_.end(); ++iter) { 2891 // Make sure not sending the same packet to default channel more than once. 2892 if (IsDefaultChannel(iter->second.channel) && has_sent_to_default_channel) 2893 continue; 2894 2895 engine()->voe()->network()->ReceivedRTCPPacket( 2896 iter->second.channel, 2897 packet->data(), 2898 static_cast<unsigned int>(packet->length())); 2899 } 2900 } 2901 2902 bool WebRtcVoiceMediaChannel::MuteStream(uint32 ssrc, bool muted) { 2903 int channel = (ssrc == 0) ? voe_channel() : GetSendChannelNum(ssrc); 2904 if (channel == -1) { 2905 LOG(LS_WARNING) << "The specified ssrc " << ssrc << " is not in use."; 2906 return false; 2907 } 2908 if (engine()->voe()->volume()->SetInputMute(channel, muted) == -1) { 2909 LOG_RTCERR2(SetInputMute, channel, muted); 2910 return false; 2911 } 2912 return true; 2913 } 2914 2915 bool WebRtcVoiceMediaChannel::SetSendBandwidth(bool autobw, int bps) { 2916 LOG(LS_INFO) << "WebRtcVoiceMediaChanne::SetSendBandwidth."; 2917 2918 send_bw_setting_ = true; 2919 send_autobw_ = autobw; 2920 send_bw_bps_ = bps; 2921 2922 return SetSendBandwidthInternal(send_autobw_, send_bw_bps_); 2923 } 2924 2925 bool WebRtcVoiceMediaChannel::SetSendBandwidthInternal(bool autobw, int bps) { 2926 LOG(LS_INFO) << "WebRtcVoiceMediaChanne::SetSendBandwidthInternal."; 2927 2928 if (!send_codec_) { 2929 LOG(LS_INFO) << "The send codec has not been set up yet. " 2930 << "The send bandwidth setting will be applied later."; 2931 return true; 2932 } 2933 2934 // Bandwidth is auto by default. 2935 if (autobw || bps <= 0) 2936 return true; 2937 2938 webrtc::CodecInst codec = *send_codec_; 2939 bool is_multi_rate = IsCodecMultiRate(codec); 2940 2941 if (is_multi_rate) { 2942 // If codec is multi-rate then just set the bitrate. 2943 codec.rate = bps; 2944 if (!SetSendCodec(codec)) { 2945 LOG(LS_INFO) << "Failed to set codec " << codec.plname 2946 << " to bitrate " << bps << " bps."; 2947 return false; 2948 } 2949 return true; 2950 } else { 2951 // If codec is not multi-rate and |bps| is less than the fixed bitrate 2952 // then fail. If codec is not multi-rate and |bps| exceeds or equal the 2953 // fixed bitrate then ignore. 2954 if (bps < codec.rate) { 2955 LOG(LS_INFO) << "Failed to set codec " << codec.plname 2956 << " to bitrate " << bps << " bps" 2957 << ", requires at least " << codec.rate << " bps."; 2958 return false; 2959 } 2960 return true; 2961 } 2962 } 2963 2964 bool WebRtcVoiceMediaChannel::GetStats(VoiceMediaInfo* info) { 2965 bool echo_metrics_on = false; 2966 // These can take on valid negative values, so use the lowest possible level 2967 // as default rather than -1. 2968 int echo_return_loss = -100; 2969 int echo_return_loss_enhancement = -100; 2970 // These can also be negative, but in practice -1 is only used to signal 2971 // insufficient data, since the resolution is limited to multiples of 4 ms. 2972 int echo_delay_median_ms = -1; 2973 int echo_delay_std_ms = -1; 2974 if (engine()->voe()->processing()->GetEcMetricsStatus( 2975 echo_metrics_on) != -1 && echo_metrics_on) { 2976 // TODO(ajm): we may want to use VoECallReport::GetEchoMetricsSummary 2977 // here, but it appears to be unsuitable currently. Revisit after this is 2978 // investigated: http://b/issue?id=5666755 2979 int erl, erle, rerl, anlp; 2980 if (engine()->voe()->processing()->GetEchoMetrics( 2981 erl, erle, rerl, anlp) != -1) { 2982 echo_return_loss = erl; 2983 echo_return_loss_enhancement = erle; 2984 } 2985 2986 int median, std; 2987 if (engine()->voe()->processing()->GetEcDelayMetrics(median, std) != -1) { 2988 echo_delay_median_ms = median; 2989 echo_delay_std_ms = std; 2990 } 2991 } 2992 2993 webrtc::CallStatistics cs; 2994 unsigned int ssrc; 2995 webrtc::CodecInst codec; 2996 unsigned int level; 2997 2998 for (ChannelMap::const_iterator channel_iter = send_channels_.begin(); 2999 channel_iter != send_channels_.end(); ++channel_iter) { 3000 const int channel = channel_iter->second.channel; 3001 3002 // Fill in the sender info, based on what we know, and what the 3003 // remote side told us it got from its RTCP report. 3004 VoiceSenderInfo sinfo; 3005 3006 if (engine()->voe()->rtp()->GetRTCPStatistics(channel, cs) == -1 || 3007 engine()->voe()->rtp()->GetLocalSSRC(channel, ssrc) == -1) { 3008 continue; 3009 } 3010 3011 sinfo.add_ssrc(ssrc); 3012 sinfo.codec_name = send_codec_.get() ? send_codec_->plname : ""; 3013 sinfo.bytes_sent = cs.bytesSent; 3014 sinfo.packets_sent = cs.packetsSent; 3015 // RTT isn't known until a RTCP report is received. Until then, VoiceEngine 3016 // returns 0 to indicate an error value. 3017 sinfo.rtt_ms = (cs.rttMs > 0) ? cs.rttMs : -1; 3018 3019 // Get data from the last remote RTCP report. Use default values if no data 3020 // available. 3021 sinfo.fraction_lost = -1.0; 3022 sinfo.jitter_ms = -1; 3023 sinfo.packets_lost = -1; 3024 sinfo.ext_seqnum = -1; 3025 std::vector<webrtc::ReportBlock> receive_blocks; 3026 if (engine()->voe()->rtp()->GetRemoteRTCPReportBlocks( 3027 channel, &receive_blocks) != -1 && 3028 engine()->voe()->codec()->GetSendCodec(channel, codec) != -1) { 3029 std::vector<webrtc::ReportBlock>::iterator iter; 3030 for (iter = receive_blocks.begin(); iter != receive_blocks.end(); 3031 ++iter) { 3032 // Lookup report for send ssrc only. 3033 if (iter->source_SSRC == sinfo.ssrc()) { 3034 // Convert Q8 to floating point. 3035 sinfo.fraction_lost = static_cast<float>(iter->fraction_lost) / 256; 3036 // Convert samples to milliseconds. 3037 if (codec.plfreq / 1000 > 0) { 3038 sinfo.jitter_ms = iter->interarrival_jitter / (codec.plfreq / 1000); 3039 } 3040 sinfo.packets_lost = iter->cumulative_num_packets_lost; 3041 sinfo.ext_seqnum = iter->extended_highest_sequence_number; 3042 break; 3043 } 3044 } 3045 } 3046 3047 // Local speech level. 3048 sinfo.audio_level = (engine()->voe()->volume()-> 3049 GetSpeechInputLevelFullRange(level) != -1) ? level : -1; 3050 3051 // TODO(xians): We are injecting the same APM logging to all the send 3052 // channels here because there is no good way to know which send channel 3053 // is using the APM. The correct fix is to allow the send channels to have 3054 // their own APM so that we can feed the correct APM logging to different 3055 // send channels. See issue crbug/264611 . 3056 sinfo.echo_return_loss = echo_return_loss; 3057 sinfo.echo_return_loss_enhancement = echo_return_loss_enhancement; 3058 sinfo.echo_delay_median_ms = echo_delay_median_ms; 3059 sinfo.echo_delay_std_ms = echo_delay_std_ms; 3060 // TODO(ajm): Re-enable this metric once we have a reliable implementation. 3061 sinfo.aec_quality_min = -1; 3062 sinfo.typing_noise_detected = typing_noise_detected_; 3063 3064 info->senders.push_back(sinfo); 3065 } 3066 3067 // Build the list of receivers, one for each receiving channel, or 1 in 3068 // a 1:1 call. 3069 std::vector<int> channels; 3070 for (ChannelMap::const_iterator it = receive_channels_.begin(); 3071 it != receive_channels_.end(); ++it) { 3072 channels.push_back(it->second.channel); 3073 } 3074 if (channels.empty()) { 3075 channels.push_back(voe_channel()); 3076 } 3077 3078 // Get the SSRC and stats for each receiver, based on our own calculations. 3079 for (std::vector<int>::const_iterator it = channels.begin(); 3080 it != channels.end(); ++it) { 3081 memset(&cs, 0, sizeof(cs)); 3082 if (engine()->voe()->rtp()->GetRemoteSSRC(*it, ssrc) != -1 && 3083 engine()->voe()->rtp()->GetRTCPStatistics(*it, cs) != -1 && 3084 engine()->voe()->codec()->GetRecCodec(*it, codec) != -1) { 3085 VoiceReceiverInfo rinfo; 3086 rinfo.add_ssrc(ssrc); 3087 rinfo.bytes_rcvd = cs.bytesReceived; 3088 rinfo.packets_rcvd = cs.packetsReceived; 3089 // The next four fields are from the most recently sent RTCP report. 3090 // Convert Q8 to floating point. 3091 rinfo.fraction_lost = static_cast<float>(cs.fractionLost) / (1 << 8); 3092 rinfo.packets_lost = cs.cumulativeLost; 3093 rinfo.ext_seqnum = cs.extendedMax; 3094 // Convert samples to milliseconds. 3095 if (codec.plfreq / 1000 > 0) { 3096 rinfo.jitter_ms = cs.jitterSamples / (codec.plfreq / 1000); 3097 } 3098 3099 // Get jitter buffer and total delay (alg + jitter + playout) stats. 3100 webrtc::NetworkStatistics ns; 3101 if (engine()->voe()->neteq() && 3102 engine()->voe()->neteq()->GetNetworkStatistics( 3103 *it, ns) != -1) { 3104 rinfo.jitter_buffer_ms = ns.currentBufferSize; 3105 rinfo.jitter_buffer_preferred_ms = ns.preferredBufferSize; 3106 rinfo.expand_rate = 3107 static_cast<float>(ns.currentExpandRate) / (1 << 14); 3108 } 3109 if (engine()->voe()->sync()) { 3110 int jitter_buffer_delay_ms = 0; 3111 int playout_buffer_delay_ms = 0; 3112 engine()->voe()->sync()->GetDelayEstimate( 3113 *it, &jitter_buffer_delay_ms, &playout_buffer_delay_ms); 3114 rinfo.delay_estimate_ms = jitter_buffer_delay_ms + 3115 playout_buffer_delay_ms; 3116 } 3117 3118 // Get speech level. 3119 rinfo.audio_level = (engine()->voe()->volume()-> 3120 GetSpeechOutputLevelFullRange(*it, level) != -1) ? level : -1; 3121 info->receivers.push_back(rinfo); 3122 } 3123 } 3124 3125 return true; 3126 } 3127 3128 void WebRtcVoiceMediaChannel::GetLastMediaError( 3129 uint32* ssrc, VoiceMediaChannel::Error* error) { 3130 ASSERT(ssrc != NULL); 3131 ASSERT(error != NULL); 3132 FindSsrc(voe_channel(), ssrc); 3133 *error = WebRtcErrorToChannelError(GetLastEngineError()); 3134 } 3135 3136 bool WebRtcVoiceMediaChannel::FindSsrc(int channel_num, uint32* ssrc) { 3137 talk_base::CritScope lock(&receive_channels_cs_); 3138 ASSERT(ssrc != NULL); 3139 if (channel_num == -1 && send_ != SEND_NOTHING) { 3140 // Sometimes the VoiceEngine core will throw error with channel_num = -1. 3141 // This means the error is not limited to a specific channel. Signal the 3142 // message using ssrc=0. If the current channel is sending, use this 3143 // channel for sending the message. 3144 *ssrc = 0; 3145 return true; 3146 } else { 3147 // Check whether this is a sending channel. 3148 for (ChannelMap::const_iterator it = send_channels_.begin(); 3149 it != send_channels_.end(); ++it) { 3150 if (it->second.channel == channel_num) { 3151 // This is a sending channel. 3152 uint32 local_ssrc = 0; 3153 if (engine()->voe()->rtp()->GetLocalSSRC( 3154 channel_num, local_ssrc) != -1) { 3155 *ssrc = local_ssrc; 3156 } 3157 return true; 3158 } 3159 } 3160 3161 // Check whether this is a receiving channel. 3162 for (ChannelMap::const_iterator it = receive_channels_.begin(); 3163 it != receive_channels_.end(); ++it) { 3164 if (it->second.channel == channel_num) { 3165 *ssrc = it->first; 3166 return true; 3167 } 3168 } 3169 } 3170 return false; 3171 } 3172 3173 void WebRtcVoiceMediaChannel::OnError(uint32 ssrc, int error) { 3174 if (error == VE_TYPING_NOISE_WARNING) { 3175 typing_noise_detected_ = true; 3176 } else if (error == VE_TYPING_NOISE_OFF_WARNING) { 3177 typing_noise_detected_ = false; 3178 } 3179 SignalMediaError(ssrc, WebRtcErrorToChannelError(error)); 3180 } 3181 3182 int WebRtcVoiceMediaChannel::GetOutputLevel(int channel) { 3183 unsigned int ulevel; 3184 int ret = 3185 engine()->voe()->volume()->GetSpeechOutputLevel(channel, ulevel); 3186 return (ret == 0) ? static_cast<int>(ulevel) : -1; 3187 } 3188 3189 int WebRtcVoiceMediaChannel::GetReceiveChannelNum(uint32 ssrc) { 3190 ChannelMap::iterator it = receive_channels_.find(ssrc); 3191 if (it != receive_channels_.end()) 3192 return it->second.channel; 3193 return (ssrc == default_receive_ssrc_) ? voe_channel() : -1; 3194 } 3195 3196 int WebRtcVoiceMediaChannel::GetSendChannelNum(uint32 ssrc) { 3197 ChannelMap::iterator it = send_channels_.find(ssrc); 3198 if (it != send_channels_.end()) 3199 return it->second.channel; 3200 3201 return -1; 3202 } 3203 3204 bool WebRtcVoiceMediaChannel::GetRedSendCodec(const AudioCodec& red_codec, 3205 const std::vector<AudioCodec>& all_codecs, webrtc::CodecInst* send_codec) { 3206 // Get the RED encodings from the parameter with no name. This may 3207 // change based on what is discussed on the Jingle list. 3208 // The encoding parameter is of the form "a/b"; we only support where 3209 // a == b. Verify this and parse out the value into red_pt. 3210 // If the parameter value is absent (as it will be until we wire up the 3211 // signaling of this message), use the second codec specified (i.e. the 3212 // one after "red") as the encoding parameter. 3213 int red_pt = -1; 3214 std::string red_params; 3215 CodecParameterMap::const_iterator it = red_codec.params.find(""); 3216 if (it != red_codec.params.end()) { 3217 red_params = it->second; 3218 std::vector<std::string> red_pts; 3219 if (talk_base::split(red_params, '/', &red_pts) != 2 || 3220 red_pts[0] != red_pts[1] || 3221 !talk_base::FromString(red_pts[0], &red_pt)) { 3222 LOG(LS_WARNING) << "RED params " << red_params << " not supported."; 3223 return false; 3224 } 3225 } else if (red_codec.params.empty()) { 3226 LOG(LS_WARNING) << "RED params not present, using defaults"; 3227 if (all_codecs.size() > 1) { 3228 red_pt = all_codecs[1].id; 3229 } 3230 } 3231 3232 // Try to find red_pt in |codecs|. 3233 std::vector<AudioCodec>::const_iterator codec; 3234 for (codec = all_codecs.begin(); codec != all_codecs.end(); ++codec) { 3235 if (codec->id == red_pt) 3236 break; 3237 } 3238 3239 // If we find the right codec, that will be the codec we pass to 3240 // SetSendCodec, with the desired payload type. 3241 if (codec != all_codecs.end() && 3242 engine()->FindWebRtcCodec(*codec, send_codec)) { 3243 } else { 3244 LOG(LS_WARNING) << "RED params " << red_params << " are invalid."; 3245 return false; 3246 } 3247 3248 return true; 3249 } 3250 3251 bool WebRtcVoiceMediaChannel::EnableRtcp(int channel) { 3252 if (engine()->voe()->rtp()->SetRTCPStatus(channel, true) == -1) { 3253 LOG_RTCERR2(SetRTCPStatus, channel, 1); 3254 return false; 3255 } 3256 // TODO(juberti): Enable VQMon and RTCP XR reports, once we know what 3257 // what we want to do with them. 3258 // engine()->voe().EnableVQMon(voe_channel(), true); 3259 // engine()->voe().EnableRTCP_XR(voe_channel(), true); 3260 return true; 3261 } 3262 3263 bool WebRtcVoiceMediaChannel::ResetRecvCodecs(int channel) { 3264 int ncodecs = engine()->voe()->codec()->NumOfCodecs(); 3265 for (int i = 0; i < ncodecs; ++i) { 3266 webrtc::CodecInst voe_codec; 3267 if (engine()->voe()->codec()->GetCodec(i, voe_codec) != -1) { 3268 voe_codec.pltype = -1; 3269 if (engine()->voe()->codec()->SetRecPayloadType( 3270 channel, voe_codec) == -1) { 3271 LOG_RTCERR2(SetRecPayloadType, channel, ToString(voe_codec)); 3272 return false; 3273 } 3274 } 3275 } 3276 return true; 3277 } 3278 3279 bool WebRtcVoiceMediaChannel::SetPlayout(int channel, bool playout) { 3280 if (playout) { 3281 LOG(LS_INFO) << "Starting playout for channel #" << channel; 3282 if (engine()->voe()->base()->StartPlayout(channel) == -1) { 3283 LOG_RTCERR1(StartPlayout, channel); 3284 return false; 3285 } 3286 } else { 3287 LOG(LS_INFO) << "Stopping playout for channel #" << channel; 3288 engine()->voe()->base()->StopPlayout(channel); 3289 } 3290 return true; 3291 } 3292 3293 uint32 WebRtcVoiceMediaChannel::ParseSsrc(const void* data, size_t len, 3294 bool rtcp) { 3295 size_t ssrc_pos = (!rtcp) ? 8 : 4; 3296 uint32 ssrc = 0; 3297 if (len >= (ssrc_pos + sizeof(ssrc))) { 3298 ssrc = talk_base::GetBE32(static_cast<const char*>(data) + ssrc_pos); 3299 } 3300 return ssrc; 3301 } 3302 3303 // Convert VoiceEngine error code into VoiceMediaChannel::Error enum. 3304 VoiceMediaChannel::Error 3305 WebRtcVoiceMediaChannel::WebRtcErrorToChannelError(int err_code) { 3306 switch (err_code) { 3307 case 0: 3308 return ERROR_NONE; 3309 case VE_CANNOT_START_RECORDING: 3310 case VE_MIC_VOL_ERROR: 3311 case VE_GET_MIC_VOL_ERROR: 3312 case VE_CANNOT_ACCESS_MIC_VOL: 3313 return ERROR_REC_DEVICE_OPEN_FAILED; 3314 case VE_SATURATION_WARNING: 3315 return ERROR_REC_DEVICE_SATURATION; 3316 case VE_REC_DEVICE_REMOVED: 3317 return ERROR_REC_DEVICE_REMOVED; 3318 case VE_RUNTIME_REC_WARNING: 3319 case VE_RUNTIME_REC_ERROR: 3320 return ERROR_REC_RUNTIME_ERROR; 3321 case VE_CANNOT_START_PLAYOUT: 3322 case VE_SPEAKER_VOL_ERROR: 3323 case VE_GET_SPEAKER_VOL_ERROR: 3324 case VE_CANNOT_ACCESS_SPEAKER_VOL: 3325 return ERROR_PLAY_DEVICE_OPEN_FAILED; 3326 case VE_RUNTIME_PLAY_WARNING: 3327 case VE_RUNTIME_PLAY_ERROR: 3328 return ERROR_PLAY_RUNTIME_ERROR; 3329 case VE_TYPING_NOISE_WARNING: 3330 return ERROR_REC_TYPING_NOISE_DETECTED; 3331 default: 3332 return VoiceMediaChannel::ERROR_OTHER; 3333 } 3334 } 3335 3336 int WebRtcSoundclipStream::Read(void *buf, int len) { 3337 size_t res = 0; 3338 mem_.Read(buf, len, &res, NULL); 3339 return static_cast<int>(res); 3340 } 3341 3342 int WebRtcSoundclipStream::Rewind() { 3343 mem_.Rewind(); 3344 // Return -1 to keep VoiceEngine from looping. 3345 return (loop_) ? 0 : -1; 3346 } 3347 3348 } // namespace cricket 3349 3350 #endif // HAVE_WEBRTC_VOICE 3351