Commit 6f4775a8 authored by Max Kellermann's avatar Max Kellermann

pcm/Neon: apply bit shift during float->int conversion

Avoid multiplication. This is a speedup of 20%.
parent c7e2f558
...@@ -68,21 +68,16 @@ struct NeonFloatTo16 { ...@@ -68,21 +68,16 @@ struct NeonFloatTo16 {
static constexpr size_t BLOCK_SIZE = 16; static constexpr size_t BLOCK_SIZE = 16;
void Convert(int16_t *dst, const float *src, const size_t n) const { void Convert(int16_t *dst, const float *src, const size_t n) const {
const float32x4_t factor =
vdupq_n_f32(1 << (DstTraits::BITS - 1));
for (unsigned i = 0; i < n / BLOCK_SIZE; for (unsigned i = 0; i < n / BLOCK_SIZE;
++i, src += BLOCK_SIZE, dst += BLOCK_SIZE) { ++i, src += BLOCK_SIZE, dst += BLOCK_SIZE) {
/* load 16 float samples into 4 quad /* load 16 float samples into 4 quad
registers */ registers */
float32x4x4_t value = vld4q_f32(src); float32x4x4_t value = vld4q_f32(src);
/* apply factor */
neon_x4_b(vmulq_f32, value, value, factor);
/* convert to 32 bit integer */ /* convert to 32 bit integer */
int32x4x4_t ivalue; int32x4x4_t ivalue;
neon_x4_u(vcvtq_s32_f32, ivalue, value); neon_x4_b(vcvtq_n_s32_f32, ivalue, value,
DstTraits::BITS - 1);
/* convert to 16 bit integer with saturation */ /* convert to 16 bit integer with saturation */
int16x4x4_t nvalue; int16x4x4_t nvalue;
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment