Go to the documentation of this file.
36 static void lpc_compute_autocorr_sse2(
const double *
data, ptrdiff_t
len,
int lag,
44 for(j=0; j<lag; j+=2){
48 "movsd "MANGLE(pd_1)
", %%xmm0 \n\t"
49 "movsd "MANGLE(pd_1)
", %%xmm1 \n\t"
50 "movsd "MANGLE(pd_1)
", %%xmm2 \n\t"
52 "movapd (%2,%0), %%xmm3 \n\t"
53 "movupd -8(%3,%0), %%xmm4 \n\t"
54 "movapd (%3,%0), %%xmm5 \n\t"
55 "mulpd %%xmm3, %%xmm4 \n\t"
56 "mulpd %%xmm3, %%xmm5 \n\t"
57 "mulpd -16(%3,%0), %%xmm3 \n\t"
58 "addpd %%xmm4, %%xmm1 \n\t"
59 "addpd %%xmm5, %%xmm0 \n\t"
60 "addpd %%xmm3, %%xmm2 \n\t"
63 "movhlps %%xmm0, %%xmm3 \n\t"
64 "movhlps %%xmm1, %%xmm4 \n\t"
65 "movhlps %%xmm2, %%xmm5 \n\t"
66 "addsd %%xmm3, %%xmm0 \n\t"
67 "addsd %%xmm4, %%xmm1 \n\t"
68 "addsd %%xmm5, %%xmm2 \n\t"
69 "movsd %%xmm0, (%1) \n\t"
70 "movsd %%xmm1, 8(%1) \n\t"
71 "movsd %%xmm2, 16(%1) \n\t"
79 "movsd "MANGLE(pd_1)
", %%xmm0 \n\t"
80 "movsd "MANGLE(pd_1)
", %%xmm1 \n\t"
82 "movapd (%3,%0), %%xmm3 \n\t"
83 "movupd -8(%4,%0), %%xmm4 \n\t"
84 "mulpd %%xmm3, %%xmm4 \n\t"
85 "mulpd (%4,%0), %%xmm3 \n\t"
86 "addpd %%xmm4, %%xmm1 \n\t"
87 "addpd %%xmm3, %%xmm0 \n\t"
90 "movhlps %%xmm0, %%xmm3 \n\t"
91 "movhlps %%xmm1, %%xmm4 \n\t"
92 "addsd %%xmm3, %%xmm0 \n\t"
93 "addsd %%xmm4, %%xmm1 \n\t"
94 "movsd %%xmm0, %1 \n\t"
95 "movsd %%xmm1, %2 \n\t"
96 :
"+&r"(
i),
"=m"(autoc[j]),
"=m"(autoc[j+1])
112 c->lpc_compute_autocorr = lpc_compute_autocorr_sse2;
DECLARE_ASM_CONST(16, double, pd_1)[2]
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
static atomic_int cpu_flags
void ff_lpc_apply_welch_window_sse2(const int32_t *data, ptrdiff_t len, double *w_data)
av_cold void ff_lpc_init_x86(LPCContext *c)
#define EXTERNAL_AVX2(flags)
#define NAMED_CONSTRAINTS_ARRAY_ADD(...)
Undefined Behavior In the C some operations are like signed integer dereferencing freed accessing outside allocated Undefined Behavior must not occur in a C it is not safe even if the output of undefined operations is unused The unsafety may seem nit picking but Optimizing compilers have in fact optimized code on the assumption that no undefined Behavior occurs Optimizing code based on wrong assumptions can and has in some cases lead to effects beyond the output of computations The signed integer overflow problem in speed critical code Code which is highly optimized and works with signed integers sometimes has the problem that often the output of the computation does not c
#define EXTERNAL_SSE2(flags)
#define i(width, name, range_min, range_max)
void ff_lpc_apply_welch_window_avx2(const int32_t *data, ptrdiff_t len, double *w_data)
__asm__(".macro parse_r var r\n\t" "\\var = -1\n\t" _IFC_REG(0) _IFC_REG(1) _IFC_REG(2) _IFC_REG(3) _IFC_REG(4) _IFC_REG(5) _IFC_REG(6) _IFC_REG(7) _IFC_REG(8) _IFC_REG(9) _IFC_REG(10) _IFC_REG(11) _IFC_REG(12) _IFC_REG(13) _IFC_REG(14) _IFC_REG(15) _IFC_REG(16) _IFC_REG(17) _IFC_REG(18) _IFC_REG(19) _IFC_REG(20) _IFC_REG(21) _IFC_REG(22) _IFC_REG(23) _IFC_REG(24) _IFC_REG(25) _IFC_REG(26) _IFC_REG(27) _IFC_REG(28) _IFC_REG(29) _IFC_REG(30) _IFC_REG(31) ".iflt \\var\n\t" ".error \"Unable to parse register name \\r\"\n\t" ".endif\n\t" ".endm")
#define INLINE_SSE2_SLOW(flags)