|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#include "common.h" |
|
#include "fixed_dsp.h" |
|
|
|
/*
 * Fixed-point multiply-add over three vectors:
 *
 *   dst[i] = src2[i] + ((src0[i] * src1[i] + 0x40000000) >> 31)
 *
 * The product is formed in 64 bits; 0x40000000 (half of 2^31) is added
 * before the shift so the scaled product is rounded rather than truncated.
 *
 * dst  - output vector, len elements are written
 * src0 - first factor
 * src1 - second factor
 * src2 - addend
 * len  - number of elements; nothing is read or written when len <= 0
 */
static void vector_fmul_add_c(int *dst, const int *src0, const int *src1, const int *src2, int len){
    int i;
    int64_t accu;

    for (i = 0; i < len; i++) {
        accu = (int64_t)src0[i] * src1[i];
        /* Sum in unsigned arithmetic: a result outside the int range then
         * wraps instead of triggering signed-overflow undefined behaviour. */
        dst[i] = (int)((unsigned)src2[i] + (unsigned)((accu + 0x40000000) >> 31));
    }
}
|
|
|
/*
 * Multiply src0 element-wise with src1 traversed back to front:
 *
 *   dst[n] = (src0[n] * src1[len - 1 - n] + 0x40000000) >> 31
 *
 * Each product is computed in 64 bits and rounded by adding half of 2^31
 * before the shift.
 *
 * dst  - output vector, len elements are written
 * src0 - first factor, read in ascending order
 * src1 - second factor, read in descending order
 * len  - number of elements; the loop does not run when len <= 0
 */
static void vector_fmul_reverse_c(int *dst, const int *src0, const int *src1, int len)
{
    int n;

    for (n = 0; n < len; n++) {
        const int64_t prod = (int64_t)src0[n] * src1[len - 1 - n];

        dst[n] = (int)((prod + 0x40000000) >> 31);
    }
}
|
|
|
/*
 * Windowed overlap of two int32 vectors, scaled down by `bits` and clipped
 * to 16 bits.
 *
 * For k in [0, len), with fwd = k - len and rev = len - 1 - k taken relative
 * to the middle of dst/win and the end of src0:
 *
 *   dst[fwd] = clip16((((src0[fwd]*win[rev] - src1[rev]*win[fwd] + 2^30) >> 31) + round) >> bits)
 *   dst[rev] = clip16((((src0[fwd]*win[fwd] + src1[rev]*win[rev] + 2^30) >> 31) + round) >> bits)
 *
 * dst  - output, 2 * len elements are written
 * src0 - first input, len elements, read front to back
 * src1 - second input, len elements, read back to front
 * win  - window coefficients, 2 * len elements
 * len  - half of the output length
 * bits - right shift applied before clipping; round is 1 << (bits - 1),
 *        or 0 when bits is 0
 */
static void vector_fmul_window_scaled_c(int16_t *dst, const int32_t *src0,
                                        const int32_t *src1, const int32_t *win,
                                        int len, uint8_t bits)
{
    const int32_t round = bits ? 1 << (bits - 1) : 0;
    int16_t *const dst_mid = dst + len;
    const int32_t *const win_mid = win + len;
    const int32_t *const src0_end = src0 + len;
    int32_t fwd, rev;

    for (fwd = -len, rev = len - 1; fwd < 0; fwd++, rev--) {
        /* Load all four operands before storing anything. */
        const int64_t a     = src0_end[fwd];
        const int64_t b     = src1[rev];
        const int64_t w_fwd = win_mid[fwd];
        const int64_t w_rev = win_mid[rev];
        const int64_t diff  = (a * w_rev - b * w_fwd + 0x40000000) >> 31;
        const int64_t sum   = (a * w_fwd + b * w_rev + 0x40000000) >> 31;

        dst_mid[fwd] = av_clip_int16((diff + round) >> bits);
        dst_mid[rev] = av_clip_int16((sum + round) >> bits);
    }
}
|
|
|
/*
 * Windowed overlap of two int32 vectors.
 *
 * For k in [0, len), with fwd = k - len and rev = len - 1 - k taken relative
 * to the middle of dst/win and the end of src0:
 *
 *   dst[fwd] = (src0[fwd]*win[rev] - src1[rev]*win[fwd] + 0x40000000) >> 31
 *   dst[rev] = (src0[fwd]*win[fwd] + src1[rev]*win[rev] + 0x40000000) >> 31
 *
 * Products are formed in 64 bits; 0x40000000 rounds the >> 31.
 *
 * dst  - output, 2 * len elements are written
 * src0 - first input, len elements, read front to back
 * src1 - second input, len elements, read back to front
 * win  - window coefficients, 2 * len elements
 * len  - half of the output length
 */
static void vector_fmul_window_c(int32_t *dst, const int32_t *src0,
                                 const int32_t *src1, const int32_t *win,
                                 int len)
{
    int32_t *const dst_mid = dst + len;
    const int32_t *const win_mid = win + len;
    const int32_t *const src0_end = src0 + len;
    int32_t fwd, rev;

    for (fwd = -len, rev = len - 1; fwd < 0; fwd++, rev--) {
        /* Load all four operands before storing anything. */
        const int64_t a     = src0_end[fwd];
        const int64_t b     = src1[rev];
        const int64_t w_fwd = win_mid[fwd];
        const int64_t w_rev = win_mid[rev];

        dst_mid[fwd] = (a * w_rev - b * w_fwd + 0x40000000) >> 31;
        dst_mid[rev] = (a * w_fwd + b * w_rev + 0x40000000) >> 31;
    }
}
|
|
|
/*
 * Element-wise fixed-point product of two vectors:
 *
 *   dst[i] = (src0[i] * src1[i] + 0x40000000) >> 31
 *
 * The product is computed in 64 bits and rounded by adding half of 2^31
 * before the shift.
 *
 * dst  - output vector, len elements are written
 * src0 - first factor
 * src1 - second factor
 * len  - number of elements; nothing happens when len <= 0
 */
static void vector_fmul_c(int *dst, const int *src0, const int *src1, int len)
{
    for (; len > 0; len--) {
        const int64_t prod = (int64_t)*src0++ * *src1++;

        *dst++ = (int)((prod + 0x40000000) >> 31);
    }
}
|
|
|
/*
 * Fixed-point dot product of v1 and v2.
 *
 * All len products are summed in a 64-bit accumulator that starts at
 * 0x40000000, so the single >> 31 at the end rounds the total instead of
 * truncating it.
 *
 * v1, v2 - input vectors, len elements each
 * len    - number of elements; with len <= 0 the result is 0
 *
 * Returns the accumulated sum shifted right by 31, converted to int.
 */
static int scalarproduct_fixed_c(const int *v1, const int *v2, int len)
{
    int64_t acc = 0x40000000;
    int k = 0;

    while (k < len) {
        acc += (int64_t)v1[k] * v2[k];
        k++;
    }

    return (int)(acc >> 31);
}
|
|
|
/*
 * In-place butterfly over two vectors:
 *
 *   v1s[n] <- v1s[n] + v2[n]
 *   v2[n]  <- v1s[n] - v2[n]   (using the old v1s[n])
 *
 * The arithmetic is carried out on unsigned values, so sums and differences
 * outside the int range wrap around rather than overflowing a signed type.
 *
 * v1s - first vector, receives the sums
 * v2  - second vector, receives the differences
 * len - number of elements; nothing happens when len <= 0
 */
static void butterflies_fixed_c(int *av_restrict v1s, int *av_restrict v2, int len)
{
    unsigned int *const v1 = (unsigned int *)v1s;
    int n;

    for (n = 0; n < len; n++) {
        /* Read both inputs before either output is stored. */
        const unsigned int a = v1[n];
        const unsigned int b = v2[n];

        v1[n] = a + b;
        v2[n] = a - b;
    }
}
|
|
|
AVFixedDSPContext * avpriv_alloc_fixed_dsp(int bit_exact) |
|
{ |
|
AVFixedDSPContext * fdsp = av_malloc(sizeof(AVFixedDSPContext)); |
|
|
|
if (!fdsp) |
|
return NULL; |
|
|
|
fdsp->vector_fmul_window_scaled = vector_fmul_window_scaled_c; |
|
fdsp->vector_fmul_window = vector_fmul_window_c; |
|
fdsp->vector_fmul = vector_fmul_c; |
|
fdsp->vector_fmul_add = vector_fmul_add_c; |
|
fdsp->vector_fmul_reverse = vector_fmul_reverse_c; |
|
fdsp->butterflies_fixed = butterflies_fixed_c; |
|
fdsp->scalarproduct_fixed = scalarproduct_fixed_c; |
|
|
|
#if ARCH_RISCV |
|
ff_fixed_dsp_init_riscv(fdsp); |
|
#elif ARCH_X86 |
|
ff_fixed_dsp_init_x86(fdsp); |
|
#endif |
|
|
|
return fdsp; |
|
} |
|
|