/* * libjingle * Copyright 2004 Google Inc. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are met: * * 1. Redistributions of source code must retain the above copyright notice, * this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright notice, * this list of conditions and the following disclaimer in the documentation * and/or other materials provided with the distribution. * 3. The name of the author may not be used to endorse or promote products * derived from this software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO * EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #ifndef TALK_MEDIA_WEBRTCVOICEENGINE_H_ #define TALK_MEDIA_WEBRTCVOICEENGINE_H_ #include #include #include #include #include "talk/media/base/rtputils.h" #include "talk/media/webrtc/webrtccommon.h" #include "talk/media/webrtc/webrtcvoe.h" #include "talk/session/media/channel.h" #include "webrtc/base/buffer.h" #include "webrtc/base/byteorder.h" #include "webrtc/base/logging.h" #include "webrtc/base/scoped_ptr.h" #include "webrtc/base/stream.h" #include "webrtc/base/thread_checker.h" #include "webrtc/call.h" #include "webrtc/common.h" #include "webrtc/config.h" namespace cricket { class AudioDeviceModule; class AudioRenderer; class VoETraceWrapper; class VoEWrapper; class WebRtcVoiceMediaChannel; // WebRtcVoiceEngine is a class to be used with CompositeMediaEngine. // It uses the WebRtc VoiceEngine library for audio handling. class WebRtcVoiceEngine : public webrtc::VoiceEngineObserver, public webrtc::TraceCallback { friend class WebRtcVoiceMediaChannel; public: WebRtcVoiceEngine(); // Dependency injection for testing. WebRtcVoiceEngine(VoEWrapper* voe_wrapper, VoETraceWrapper* tracing); ~WebRtcVoiceEngine(); bool Init(rtc::Thread* worker_thread); void Terminate(); webrtc::VoiceEngine* GetVoE() { return voe()->engine(); } VoiceMediaChannel* CreateChannel(webrtc::Call* call, const AudioOptions& options); AudioOptions GetOptions() const { return options_; } bool SetOptions(const AudioOptions& options); bool SetDevices(const Device* in_device, const Device* out_device); bool GetOutputVolume(int* level); bool SetOutputVolume(int level); int GetInputLevel(); const std::vector& codecs(); bool FindCodec(const AudioCodec& codec); bool FindWebRtcCodec(const AudioCodec& codec, webrtc::CodecInst* gcodec); const std::vector& rtp_header_extensions() const; void SetLogging(int min_sev, const char* filter); // For tracking WebRtc channels. Needed because we have to pause them // all when switching devices. // May only be called by WebRtcVoiceMediaChannel. void RegisterChannel(WebRtcVoiceMediaChannel* channel); void UnregisterChannel(WebRtcVoiceMediaChannel* channel); // Called by WebRtcVoiceMediaChannel to set a gain offset from // the default AGC target level. bool AdjustAgcLevel(int delta); VoEWrapper* voe() { return voe_wrapper_.get(); } int GetLastEngineError(); // Set the external ADM. This can only be called before Init. bool SetAudioDeviceModule(webrtc::AudioDeviceModule* adm); // Starts AEC dump using existing file. bool StartAecDump(rtc::PlatformFile file); // Stops AEC dump. void StopAecDump(); // Starts recording an RtcEventLog using an existing file until 10 minutes // pass or the StopRtcEventLog function is called. bool StartRtcEventLog(rtc::PlatformFile file); // Stops recording the RtcEventLog. void StopRtcEventLog(); private: void Construct(); void ConstructCodecs(); bool GetVoeCodec(int index, webrtc::CodecInst* codec); bool InitInternal(); void SetTraceFilter(int filter); void SetTraceOptions(const std::string& options); // Every option that is "set" will be applied. Every option not "set" will be // ignored. This allows us to selectively turn on and off different options // easily at any time. bool ApplyOptions(const AudioOptions& options); // webrtc::TraceCallback: void Print(webrtc::TraceLevel level, const char* trace, int length) override; // webrtc::VoiceEngineObserver: void CallbackOnError(int channel_id, int errCode) override; // Given the device type, name, and id, find device id. Return true and // set the output parameter rtc_id if successful. bool FindWebRtcAudioDeviceId( bool is_input, const std::string& dev_name, int dev_id, int* rtc_id); void StartAecDump(const std::string& filename); int CreateVoEChannel(); static const int kDefaultLogSeverity = rtc::LS_WARNING; // The primary instance of WebRtc VoiceEngine. rtc::scoped_ptr voe_wrapper_; rtc::scoped_ptr tracing_; // The external audio device manager webrtc::AudioDeviceModule* adm_; int log_filter_; std::string log_options_; bool is_dumping_aec_; std::vector codecs_; std::vector rtp_header_extensions_; std::vector channels_; // channels_ can be read from WebRtc callback thread. We need a lock on that // callback as well as the RegisterChannel/UnregisterChannel. rtc::CriticalSection channels_cs_; webrtc::AgcConfig default_agc_config_; webrtc::Config voe_config_; bool initialized_; AudioOptions options_; // Cache received extended_filter_aec, delay_agnostic_aec and experimental_ns // values, and apply them in case they are missing in the audio options. We // need to do this because SetExtraOptions() will revert to defaults for // options which are not provided. Settable extended_filter_aec_; Settable delay_agnostic_aec_; Settable experimental_ns_; RTC_DISALLOW_COPY_AND_ASSIGN(WebRtcVoiceEngine); }; // WebRtcVoiceMediaChannel is an implementation of VoiceMediaChannel that uses // WebRtc Voice Engine. class WebRtcVoiceMediaChannel : public VoiceMediaChannel, public webrtc::Transport { public: WebRtcVoiceMediaChannel(WebRtcVoiceEngine* engine, const AudioOptions& options, webrtc::Call* call); ~WebRtcVoiceMediaChannel() override; const AudioOptions& options() const { return options_; } bool SetSendParameters(const AudioSendParameters& params) override; bool SetRecvParameters(const AudioRecvParameters& params) override; bool SetPlayout(bool playout) override; bool PausePlayout(); bool ResumePlayout(); bool SetSend(SendFlags send) override; bool PauseSend(); bool ResumeSend(); bool SetAudioSend(uint32_t ssrc, bool enable, const AudioOptions* options, AudioRenderer* renderer) override; bool AddSendStream(const StreamParams& sp) override; bool RemoveSendStream(uint32_t ssrc) override; bool AddRecvStream(const StreamParams& sp) override; bool RemoveRecvStream(uint32_t ssrc) override; bool GetActiveStreams(AudioInfo::StreamList* actives) override; int GetOutputLevel() override; int GetTimeSinceLastTyping() override; void SetTypingDetectionParameters(int time_window, int cost_per_typing, int reporting_threshold, int penalty_decay, int type_event_delay) override; bool SetOutputVolume(uint32_t ssrc, double volume) override; bool CanInsertDtmf() override; bool InsertDtmf(uint32_t ssrc, int event, int duration, int flags) override; void OnPacketReceived(rtc::Buffer* packet, const rtc::PacketTime& packet_time) override; void OnRtcpReceived(rtc::Buffer* packet, const rtc::PacketTime& packet_time) override; void OnReadyToSend(bool ready) override {} bool GetStats(VoiceMediaInfo* info) override; // implements Transport interface bool SendRtp(const uint8_t* data, size_t len, const webrtc::PacketOptions& options) override { rtc::Buffer packet(reinterpret_cast(data), len, kMaxRtpPacketLen); rtc::PacketOptions rtc_options; rtc_options.packet_id = options.packet_id; return VoiceMediaChannel::SendPacket(&packet, rtc_options); } bool SendRtcp(const uint8_t* data, size_t len) override { rtc::Buffer packet(reinterpret_cast(data), len, kMaxRtpPacketLen); return VoiceMediaChannel::SendRtcp(&packet, rtc::PacketOptions()); } void OnError(int error); int GetReceiveChannelId(uint32_t ssrc) const; int GetSendChannelId(uint32_t ssrc) const; private: bool SetSendCodecs(const std::vector& codecs); bool SetSendRtpHeaderExtensions( const std::vector& extensions); bool SetOptions(const AudioOptions& options); bool SetMaxSendBandwidth(int bps); bool SetRecvCodecs(const std::vector& codecs); bool SetRecvRtpHeaderExtensions( const std::vector& extensions); bool SetLocalRenderer(uint32_t ssrc, AudioRenderer* renderer); bool MuteStream(uint32_t ssrc, bool mute); WebRtcVoiceEngine* engine() { return engine_; } int GetLastEngineError() { return engine()->GetLastEngineError(); } int GetOutputLevel(int channel); bool GetRedSendCodec(const AudioCodec& red_codec, const std::vector& all_codecs, webrtc::CodecInst* send_codec); bool SetPlayout(int channel, bool playout); static Error WebRtcErrorToChannelError(int err_code); typedef int (webrtc::VoERTP_RTCP::* ExtensionSetterFunction)(int, bool, unsigned char); void SetNack(int channel, bool nack_enabled); bool SetSendCodec(int channel, const webrtc::CodecInst& send_codec); bool ChangePlayout(bool playout); bool ChangeSend(SendFlags send); bool ChangeSend(int channel, SendFlags send); bool ConfigureRecvChannel(int channel); int CreateVoEChannel(); bool DeleteChannel(int channel); bool IsDefaultRecvStream(uint32_t ssrc) { return default_recv_ssrc_ == static_cast(ssrc); } bool SetSendCodecs(int channel, const std::vector& codecs); bool SetSendBitrateInternal(int bps); bool SetHeaderExtension(ExtensionSetterFunction setter, int channel_id, const RtpHeaderExtension* extension); void RecreateAudioReceiveStreams(); void AddAudioReceiveStream(uint32_t ssrc); void RemoveAudioReceiveStream(uint32_t ssrc); bool SetRecvCodecsInternal(const std::vector& new_codecs); bool SetChannelRecvRtpHeaderExtensions( int channel_id, const std::vector& extensions); bool SetChannelSendRtpHeaderExtensions( int channel_id, const std::vector& extensions); rtc::ThreadChecker thread_checker_; WebRtcVoiceEngine* const engine_; std::vector recv_codecs_; std::vector send_codecs_; rtc::scoped_ptr send_codec_; bool send_bitrate_setting_; int send_bitrate_bps_; AudioOptions options_; bool dtmf_allowed_; bool desired_playout_; bool nack_enabled_; bool playout_; bool typing_noise_detected_; SendFlags desired_send_; SendFlags send_; webrtc::Call* const call_; // SSRC of unsignalled receive stream, or -1 if there isn't one. int64_t default_recv_ssrc_ = -1; // Volume for unsignalled stream, which may be set before the stream exists. double default_recv_volume_ = 1.0; // SSRC to use for RTCP receiver reports; default to 1 in case of no signaled // send streams. See: https://code.google.com/p/webrtc/issues/detail?id=4740 uint32_t receiver_reports_ssrc_ = 1; class WebRtcAudioSendStream; std::map send_streams_; std::vector send_extensions_; class WebRtcAudioReceiveStream; std::map receive_channels_; std::map receive_streams_; std::map receive_stream_params_; // receive_channels_ can be read from WebRtc callback thread. Access from // the WebRtc thread must be synchronized with edits on the worker thread. // Reads on the worker thread are ok. std::vector receive_extensions_; std::vector recv_rtp_extensions_; RTC_DISALLOW_IMPLICIT_CONSTRUCTORS(WebRtcVoiceMediaChannel); }; } // namespace cricket #endif // TALK_MEDIA_WEBRTCVOICEENGINE_H_