Implementing stereo support for G.722
This CL implements stereo support for G.722 through a new class AudioDecoderG722Stereo derived from AudioDecoderG722. Also implementing tests for G.722 stereo. Review URL: https://webrtc-codereview.appspot.com/1073006 git-svn-id: http://webrtc.googlecode.com/svn/trunk@3452 4adac7df-926f-26a2-2b94-8c16560cd09d
This commit is contained in:
@ -12,6 +12,8 @@
|
||||
|
||||
#include <assert.h>
|
||||
|
||||
#include <cstring> // memmove
|
||||
|
||||
#include "webrtc/modules/audio_coding/codecs/cng/include/webrtc_cng.h"
|
||||
#include "webrtc/modules/audio_coding/codecs/g711/include/g711_interface.h"
|
||||
#ifdef WEBRTC_CODEC_G722
|
||||
@ -287,6 +289,90 @@ int AudioDecoderG722::PacketDuration(const uint8_t* encoded,
|
||||
// 1/2 encoded byte per sample per channel.
|
||||
return 2 * encoded_len / channels_;
|
||||
}
|
||||
|
||||
AudioDecoderG722Stereo::AudioDecoderG722Stereo()
|
||||
: AudioDecoderG722(),
|
||||
state_left_(state_), // Base member |state_| is used for left channel.
|
||||
state_right_(NULL) {
|
||||
channels_ = 2;
|
||||
// |state_left_| already created by the base class AudioDecoderG722.
|
||||
WebRtcG722_CreateDecoder(reinterpret_cast<G722DecInst**>(&state_right_));
|
||||
}
|
||||
|
||||
AudioDecoderG722Stereo::~AudioDecoderG722Stereo() {
|
||||
// |state_left_| will be freed by the base class AudioDecoderG722.
|
||||
WebRtcG722_FreeDecoder(static_cast<G722DecInst*>(state_right_));
|
||||
}
|
||||
|
||||
int AudioDecoderG722Stereo::Decode(const uint8_t* encoded, size_t encoded_len,
|
||||
int16_t* decoded, SpeechType* speech_type) {
|
||||
int16_t temp_type = 1; // Default is speech.
|
||||
// De-interleave the bit-stream into two separate payloads.
|
||||
uint8_t* encoded_deinterleaved = new uint8_t[encoded_len];
|
||||
SplitStereoPacket(encoded, encoded_len, encoded_deinterleaved);
|
||||
// Decode left and right.
|
||||
int16_t ret = WebRtcG722_Decode(
|
||||
static_cast<G722DecInst*>(state_left_),
|
||||
reinterpret_cast<int16_t*>(encoded_deinterleaved),
|
||||
static_cast<int16_t>(encoded_len / 2), decoded, &temp_type);
|
||||
if (ret >= 0) {
|
||||
int decoded_len = ret;
|
||||
ret = WebRtcG722_Decode(
|
||||
static_cast<G722DecInst*>(state_right_),
|
||||
reinterpret_cast<int16_t*>(&encoded_deinterleaved[encoded_len / 2]),
|
||||
static_cast<int16_t>(encoded_len / 2), &decoded[decoded_len], &temp_type);
|
||||
if (ret == decoded_len) {
|
||||
decoded_len += ret;
|
||||
// Interleave output.
|
||||
for (int k = decoded_len / 2; k < decoded_len; k++) {
|
||||
int16_t temp = decoded[k];
|
||||
memmove(&decoded[2 * k - decoded_len + 2],
|
||||
&decoded[2 * k - decoded_len + 1],
|
||||
(decoded_len - k - 1) * sizeof(int16_t));
|
||||
decoded[2 * k - decoded_len + 1] = temp;
|
||||
}
|
||||
ret = decoded_len; // Return total number of samples.
|
||||
}
|
||||
}
|
||||
*speech_type = ConvertSpeechType(temp_type);
|
||||
delete [] encoded_deinterleaved;
|
||||
return ret;
|
||||
}
|
||||
|
||||
int AudioDecoderG722Stereo::Init() {
|
||||
int ret = WebRtcG722_DecoderInit(static_cast<G722DecInst*>(state_right_));
|
||||
if (ret != 0) {
|
||||
return ret;
|
||||
}
|
||||
return AudioDecoderG722::Init();
|
||||
}
|
||||
|
||||
// Split the stereo packet and place left and right channel after each other
|
||||
// in the output array.
|
||||
void AudioDecoderG722Stereo::SplitStereoPacket(const uint8_t* encoded,
|
||||
size_t encoded_len,
|
||||
uint8_t* encoded_deinterleaved) {
|
||||
assert(encoded);
|
||||
// Regroup the 4 bits/sample so |l1 l2| |r1 r2| |l3 l4| |r3 r4| ...,
|
||||
// where "lx" is 4 bits representing left sample number x, and "rx" right
|
||||
// sample. Two samples fit in one byte, represented with |...|.
|
||||
for (size_t i = 0; i + 1 < encoded_len; i += 2) {
|
||||
uint8_t right_byte = ((encoded[i] & 0x0F) << 4) + (encoded[i + 1] & 0x0F);
|
||||
encoded_deinterleaved[i] = (encoded[i] & 0xF0) + (encoded[i + 1] >> 4);
|
||||
encoded_deinterleaved[i + 1] = right_byte;
|
||||
}
|
||||
|
||||
// Move one byte representing right channel each loop, and place it at the
|
||||
// end of the bytestream vector. After looping the data is reordered to:
|
||||
// |l1 l2| |l3 l4| ... |l(N-1) lN| |r1 r2| |r3 r4| ... |r(N-1) r(N)|,
|
||||
// where N is the total number of samples.
|
||||
for (size_t i = 0; i < encoded_len / 2; i++) {
|
||||
uint8_t right_byte = encoded_deinterleaved[i + 1];
|
||||
memmove(&encoded_deinterleaved[i + 1], &encoded_deinterleaved[i + 2],
|
||||
encoded_len - i - 2);
|
||||
encoded_deinterleaved[encoded_len - 1] = right_byte;
|
||||
}
|
||||
}
|
||||
#endif
|
||||
|
||||
// Opus
|
||||
|
||||
Reference in New Issue
Block a user