ppsspp/ext/at3_standalone/float_dsp.h
Henrik Rydgård 090d1f8d0e atrac3: Add a cross platform restrict modifier, use it for the vector math functions
Also remove redundant parameters.

There are a bunch of other places where we could use this, so just
experimenting here.

This enables autovectorization to work here.
2024-05-02 16:57:15 +02:00

53 lines
1.8 KiB
C

/*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#pragma once
#include "compat.h"
inline void vector_fmul(float * av_restrict dst, const float * av_restrict src, int len) {
for (int i = 0; i < len; i++)
dst[i] = dst[i] * src[i];
}
/**
* Multiply a vector of floats by a scalar float. Source and
* destination vectors must overlap exactly or not at all.
*/
inline void vector_fmul_scalar(float *dst, float mul, int len) {
for (int i = 0; i < len; i++)
dst[i] *= mul;
}
/**
* Calculate the entry wise product of two vectors of floats, and store the result
* in a vector of floats. The second vector of floats is iterated over
* in reverse order.
*
* @param dst output and first input vector
* constraints: 32-byte aligned
* @param src second input vector
* constraints: 32-byte aligned
* @param len number of elements in the input
* constraints: multiple of 16
*/
inline void vector_fmul_reverse(float * av_restrict dst, const float * av_restrict src, int len) {
src += len - 1;
for (int i = 0; i < len; i++)
dst[i] *= src[-i];
}