audio_encoder_g722.cc revision 12cfc9b4dacd6942377df1f29a64bdbec591920e
1/* 2 * Copyright (c) 2014 The WebRTC project authors. All Rights Reserved. 3 * 4 * Use of this source code is governed by a BSD-style license 5 * that can be found in the LICENSE file in the root of the source 6 * tree. An additional intellectual property rights grant can be found 7 * in the file PATENTS. All contributing project authors may 8 * be found in the AUTHORS file in the root of the source tree. 9 */ 10 11#include "webrtc/modules/audio_coding/codecs/g722/include/audio_encoder_g722.h" 12 13#include <limits> 14#include "webrtc/base/checks.h" 15#include "webrtc/common_types.h" 16#include "webrtc/modules/audio_coding/codecs/g722/include/g722_interface.h" 17 18namespace webrtc { 19 20namespace { 21 22const size_t kSampleRateHz = 16000; 23 24AudioEncoderG722::Config CreateConfig(const CodecInst& codec_inst) { 25 AudioEncoderG722::Config config; 26 config.num_channels = codec_inst.channels; 27 config.frame_size_ms = codec_inst.pacsize / 16; 28 config.payload_type = codec_inst.pltype; 29 return config; 30} 31 32} // namespace 33 34bool AudioEncoderG722::Config::IsOk() const { 35 return (frame_size_ms > 0) && (frame_size_ms % 10 == 0) && 36 (num_channels >= 1); 37} 38 39AudioEncoderG722::AudioEncoderG722(const Config& config) 40 : num_channels_(config.num_channels), 41 payload_type_(config.payload_type), 42 num_10ms_frames_per_packet_( 43 static_cast<size_t>(config.frame_size_ms / 10)), 44 num_10ms_frames_buffered_(0), 45 first_timestamp_in_buffer_(0), 46 encoders_(new EncoderState[num_channels_]), 47 interleave_buffer_(2 * num_channels_) { 48 CHECK(config.IsOk()); 49 const size_t samples_per_channel = 50 kSampleRateHz / 100 * num_10ms_frames_per_packet_; 51 for (int i = 0; i < num_channels_; ++i) { 52 encoders_[i].speech_buffer.reset(new int16_t[samples_per_channel]); 53 encoders_[i].encoded_buffer.SetSize(samples_per_channel / 2); 54 } 55 Reset(); 56} 57 58AudioEncoderG722::AudioEncoderG722(const CodecInst& codec_inst) 59 : AudioEncoderG722(CreateConfig(codec_inst)) {} 60 61AudioEncoderG722::~AudioEncoderG722() = default; 62 63size_t AudioEncoderG722::MaxEncodedBytes() const { 64 return SamplesPerChannel() / 2 * num_channels_; 65} 66 67int AudioEncoderG722::SampleRateHz() const { 68 return kSampleRateHz; 69} 70 71int AudioEncoderG722::NumChannels() const { 72 return num_channels_; 73} 74 75int AudioEncoderG722::RtpTimestampRateHz() const { 76 // The RTP timestamp rate for G.722 is 8000 Hz, even though it is a 16 kHz 77 // codec. 78 return kSampleRateHz / 2; 79} 80 81size_t AudioEncoderG722::Num10MsFramesInNextPacket() const { 82 return num_10ms_frames_per_packet_; 83} 84 85size_t AudioEncoderG722::Max10MsFramesInAPacket() const { 86 return num_10ms_frames_per_packet_; 87} 88 89int AudioEncoderG722::GetTargetBitrate() const { 90 // 4 bits/sample, 16000 samples/s/channel. 91 return 64000 * NumChannels(); 92} 93 94AudioEncoder::EncodedInfo AudioEncoderG722::EncodeInternal( 95 uint32_t rtp_timestamp, 96 const int16_t* audio, 97 size_t max_encoded_bytes, 98 uint8_t* encoded) { 99 CHECK_GE(max_encoded_bytes, MaxEncodedBytes()); 100 101 if (num_10ms_frames_buffered_ == 0) 102 first_timestamp_in_buffer_ = rtp_timestamp; 103 104 // Deinterleave samples and save them in each channel's buffer. 105 const size_t start = kSampleRateHz / 100 * num_10ms_frames_buffered_; 106 for (size_t i = 0; i < kSampleRateHz / 100; ++i) 107 for (int j = 0; j < num_channels_; ++j) 108 encoders_[j].speech_buffer[start + i] = audio[i * num_channels_ + j]; 109 110 // If we don't yet have enough samples for a packet, we're done for now. 111 if (++num_10ms_frames_buffered_ < num_10ms_frames_per_packet_) { 112 return EncodedInfo(); 113 } 114 115 // Encode each channel separately. 116 CHECK_EQ(num_10ms_frames_buffered_, num_10ms_frames_per_packet_); 117 num_10ms_frames_buffered_ = 0; 118 const size_t samples_per_channel = SamplesPerChannel(); 119 for (int i = 0; i < num_channels_; ++i) { 120 const size_t encoded = WebRtcG722_Encode( 121 encoders_[i].encoder, encoders_[i].speech_buffer.get(), 122 samples_per_channel, encoders_[i].encoded_buffer.data()); 123 CHECK_EQ(encoded, samples_per_channel / 2); 124 } 125 126 // Interleave the encoded bytes of the different channels. Each separate 127 // channel and the interleaved stream encodes two samples per byte, most 128 // significant half first. 129 for (size_t i = 0; i < samples_per_channel / 2; ++i) { 130 for (int j = 0; j < num_channels_; ++j) { 131 uint8_t two_samples = encoders_[j].encoded_buffer.data()[i]; 132 interleave_buffer_.data()[j] = two_samples >> 4; 133 interleave_buffer_.data()[num_channels_ + j] = two_samples & 0xf; 134 } 135 for (int j = 0; j < num_channels_; ++j) 136 encoded[i * num_channels_ + j] = interleave_buffer_.data()[2 * j] << 4 | 137 interleave_buffer_.data()[2 * j + 1]; 138 } 139 EncodedInfo info; 140 info.encoded_bytes = samples_per_channel / 2 * num_channels_; 141 info.encoded_timestamp = first_timestamp_in_buffer_; 142 info.payload_type = payload_type_; 143 return info; 144} 145 146void AudioEncoderG722::Reset() { 147 num_10ms_frames_buffered_ = 0; 148 for (int i = 0; i < num_channels_; ++i) 149 CHECK_EQ(0, WebRtcG722_EncoderInit(encoders_[i].encoder)); 150} 151 152AudioEncoderG722::EncoderState::EncoderState() { 153 CHECK_EQ(0, WebRtcG722_CreateEncoder(&encoder)); 154} 155 156AudioEncoderG722::EncoderState::~EncoderState() { 157 CHECK_EQ(0, WebRtcG722_FreeEncoder(encoder)); 158} 159 160size_t AudioEncoderG722::SamplesPerChannel() const { 161 return kSampleRateHz / 100 * num_10ms_frames_per_packet_; 162} 163 164} // namespace webrtc 165