use of int16_t/uint16_t. This is the upshot of a recommendation by henrik.lundin and kwiberg on an original small change ( https://webrtc-codereview.appspot.com/42569004/#ps1 ) to stop using int16_t just because values could fit in it, and is similar in nature to a previous "mass change to use size_t more" ( https://webrtc-codereview.appspot.com/23129004/ ) which also needed to be split up for review but to land all at once, since, like adding "const", such changes tend to cause a lot of transitive effects. This was reviewed and approved in pieces: https://codereview.webrtc.org/1224093003 https://codereview.webrtc.org/1224123002 https://codereview.webrtc.org/1224163002 https://codereview.webrtc.org/1225133003 https://codereview.webrtc.org/1225173002 https://codereview.webrtc.org/1227163003 https://codereview.webrtc.org/1227203003 https://codereview.webrtc.org/1227213002 https://codereview.webrtc.org/1227893002 https://codereview.webrtc.org/1228793004 https://codereview.webrtc.org/1228803003 https://codereview.webrtc.org/1228823002 https://codereview.webrtc.org/1228823003 https://codereview.webrtc.org/1228843002 https://codereview.webrtc.org/1230693002 https://codereview.webrtc.org/1231713002 The change is being landed as TBR to all the folks who reviewed the above. BUG=chromium:81439 TEST=none R=andrew@webrtc.org, pbos@webrtc.org TBR=aluebs, andrew, asapersson, henrika, hlundin, jan.skoglund, kwiberg, minyue, pbos, pthatcher Review URL: https://codereview.webrtc.org/1230503003 . Cr-Commit-Position: refs/heads/master@{#9768}
60 lines
2.1 KiB
C++
60 lines
2.1 KiB
C++
/*
|
|
* Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
// Modified from the Chromium original:
|
|
// src/media/base/simd/sinc_resampler_sse.cc
|
|
|
|
#include "webrtc/common_audio/resampler/sinc_resampler.h"
|
|
|
|
#include <xmmintrin.h>
|
|
|
|
namespace webrtc {
|
|
|
|
// SSE implementation of the two-kernel convolution.
//
// Multiplies the samples at |input_ptr| element-wise with the coefficients at
// |k1| and at |k2|, accumulating each product stream separately, then blends
// the two accumulated sums as
//   (1 - kernel_interpolation_factor) * sum1 +
//        kernel_interpolation_factor  * sum2
// and returns the blended total as a single float.
//
// |k1| and |k2| are always read with aligned loads (_mm_load_ps), so both must
// be 16-byte aligned. |input_ptr| may have any alignment. Data is consumed
// four floats at a time until |kKernelSize| elements have been covered.
float SincResampler::Convolve_SSE(const float* input_ptr, const float* k1,
                                  const float* k2,
                                  double kernel_interpolation_factor) {
  __m128 acc_k1 = _mm_setzero_ps();
  __m128 acc_k2 = _mm_setzero_ps();

  // The input may or may not sit on a 16-byte boundary, so choose between the
  // aligned and the unaligned load once, outside the loops. The original
  // authors note that unrolling these loops hurt performance in local testing.
  const bool input_is_aligned =
      (reinterpret_cast<uintptr_t>(input_ptr) & 0x0F) == 0;
  if (input_is_aligned) {
    for (size_t offset = 0; offset < kKernelSize; offset += 4) {
      const __m128 samples = _mm_load_ps(input_ptr + offset);
      const __m128 product_k1 = _mm_mul_ps(samples, _mm_load_ps(k1 + offset));
      acc_k1 = _mm_add_ps(acc_k1, product_k1);
      const __m128 product_k2 = _mm_mul_ps(samples, _mm_load_ps(k2 + offset));
      acc_k2 = _mm_add_ps(acc_k2, product_k2);
    }
  } else {
    for (size_t offset = 0; offset < kKernelSize; offset += 4) {
      const __m128 samples = _mm_loadu_ps(input_ptr + offset);
      const __m128 product_k1 = _mm_mul_ps(samples, _mm_load_ps(k1 + offset));
      acc_k1 = _mm_add_ps(acc_k1, product_k1);
      const __m128 product_k2 = _mm_mul_ps(samples, _mm_load_ps(k2 + offset));
      acc_k2 = _mm_add_ps(acc_k2, product_k2);
    }
  }

  // Linear interpolation between the two per-kernel results. The weights are
  // computed in double precision and narrowed to float before broadcasting.
  const float weight_k1 =
      static_cast<float>(1.0 - kernel_interpolation_factor);
  const float weight_k2 = static_cast<float>(kernel_interpolation_factor);
  const __m128 scaled_k1 = _mm_mul_ps(acc_k1, _mm_set_ps1(weight_k1));
  const __m128 scaled_k2 = _mm_mul_ps(acc_k2, _mm_set_ps1(weight_k2));
  const __m128 blended = _mm_add_ps(scaled_k1, scaled_k2);

  // Horizontal sum of the four lanes: first fold the upper two lanes onto the
  // lower two, then add lane 1 into lane 0 and read lane 0 out.
  const __m128 folded = _mm_add_ps(_mm_movehl_ps(blended, blended), blended);
  const __m128 lane1 = _mm_shuffle_ps(folded, folded, 1);
  return _mm_cvtss_f32(_mm_add_ss(folded, lane1));
}
|
|
|
|
} // namespace webrtc
|