Commit 8e8db16a, authored by Rong Yan, committed by Michael Niedermayer
Browse files

avutil/ppc/float_dsp_altivec: ppc: Fix bug in ff_vector_fmul_add_altivec()...

avutil/ppc/float_dsp_altivec: ppc: Fix bug in ff_vector_fmul_add_altivec() affecting little endian environments on POWER8
Signed-off-by: Michael Niedermayer <michaelni@gmx.at>
parent 4a203b77
release/6.1 n7.1-dev n7.0.2 n7.0.1 n7.0 n6.2-dev n6.1.2 n6.1.1 n6.1 n6.1-dev n6.0.1 n6.0 n5.2-dev n5.1.6 n5.1.5 n5.1.4 n5.1.3 n5.1.2 n5.1.1 n5.1 n5.1-dev n5.0.3 n5.0.2 n5.0.1 n5.0 n4.5-dev n4.4.5 n4.4.4 n4.4.3 n4.4.2 n4.4.1 n4.4 n4.4-dev n4.3.8 n4.3.7 n4.3.6 n4.3.5 n4.3.4 n4.3.3 n4.3.2 n4.3.1 n4.3 n4.3-dev n4.2.10 n4.2.9 n4.2.8 n4.2.7 n4.2.6 n4.2.5 n4.2.4 n4.2.3 n4.2.2 n4.2.1 n4.2 n4.2-dev n4.1.11 n4.1.10 n4.1.9 n4.1.8 n4.1.7 n4.1.6 n4.1.5 n4.1.4 n4.1.3 n4.1.2 n4.1.1 n4.1 n4.1-dev n4.0.6 n4.0.5 n4.0.4 n4.0.3 n4.0.2 n4.0.1 n4.0 n3.5-dev n3.4.13 n3.4.12 n3.4.11 n3.4.10 n3.4.9 n3.4.8 n3.4.7 n3.4.6 n3.4.5 n3.4.4 n3.4.3 n3.4.2 n3.4.1 n3.4 n3.4-dev n3.3.9 n3.3.8 n3.3.7 n3.3.6 n3.3.5 n3.3.4 n3.3.3 n3.3.2 n3.3.1 n3.3 n3.3-dev n3.2.19 n3.2.18 n3.2.17 n3.2.16 n3.2.15 n3.2.14 n3.2.13 n3.2.12 n3.2.11 n3.2.10 n3.2.9 n3.2.8 n3.2.7 n3.2.6 n3.2.5 n3.2.4 n3.2.3 n3.2.2 n3.2.1 n3.2 n3.2-dev n3.1.11 n3.1.10 n3.1.9 n3.1.8 n3.1.7 n3.1.6 n3.1.5 n3.1.4 n3.1.3 n3.1.2 n3.1.1 n3.1 n3.1-dev n3.0.12 n3.0.11 n3.0.10 n3.0.9 n3.0.8 n3.0.7 n3.0.6 n3.0.5 n3.0.4 n3.0.3 n3.0.2 n3.0.1 n3.0 n2.9-dev n2.8.22 n2.8.21 n2.8.20 n2.8.19 n2.8.18 n2.8.17 n2.8.16 n2.8.15 n2.8.14 n2.8.13 n2.8.12 n2.8.11 n2.8.10 n2.8.9 n2.8.8 n2.8.7 n2.8.6 n2.8.5 n2.8.4 n2.8.3 n2.8.2 n2.8.1 n2.8 n2.8-dev n2.7.7 n2.7.6 n2.7.5 n2.7.4 n2.7.3 n2.7.2 n2.7.1 n2.7 n2.7-dev n2.6.9 n2.6.8 n2.6.7 n2.6.6 n2.6.5 n2.6.4 n2.6.3 n2.6.2 n2.6.1 n2.6 n2.6-dev n2.5.11 n2.5.10 n2.5.9 n2.5.8 n2.5.7 n2.5.6 n2.5.5 n2.5.4 n2.5.3 n2.5.2 n2.5.1 n2.5 n2.5-dev n2.4.14 n2.4.13 n2.4.12 n2.4.11 n2.4.10 n2.4.9 n2.4.8 n2.4.7 n2.4.6 n2.4.5 n2.4.4 n2.4.3 n2.4.2 n2.4.1 n2.4
No related merge requests found
Showing with 8 additions and 10 deletions
+8 -10
......@@ -75,20 +75,18 @@ void ff_vector_fmul_add_altivec(float *dst, const float *src0,
int len)
{
int i;
vector float d, s0, s1, s2, t0, t1, edges;
vector unsigned char align = vec_lvsr(0,dst),
mask = vec_lvsl(0, dst);
vector float d, ss0, ss1, ss2, t0, t1, edges;
for (i = 0; i < len - 3; i += 4) {
t0 = vec_ld(0, dst + i);
t1 = vec_ld(15, dst + i);
s0 = vec_ld(0, src0 + i);
s1 = vec_ld(0, src1 + i);
s2 = vec_ld(0, src2 + i);
edges = vec_perm(t1, t0, mask);
d = vec_madd(s0, s1, s2);
t1 = vec_perm(d, edges, align);
t0 = vec_perm(edges, d, align);
ss0 = vec_ld(0, src0 + i);
ss1 = vec_ld(0, src1 + i);
ss2 = vec_ld(0, src2 + i);
edges = vec_perm(t1, t0, vcprm(0, 1, 2, 3));
d = vec_madd(ss0, ss1, ss2);
t1 = vec_perm(d, edges, vcprm(s0,s1,s2,s3));
t0 = vec_perm(edges, d, vcprm(s0,s1,s2,s3));
vec_st(t1, 15, dst + i);
vec_st(t0, 0, dst + i);
}
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment