aboutsummaryrefslogtreecommitdiffstats
path: root/libavcodec/ppc/mathops.h
diff options
context:
space:
mode:
authorMåns Rullgård <mans@mansr.com>2009-05-11 02:41:50 +0000
committerMåns Rullgård <mans@mansr.com>2009-05-11 02:41:50 +0000
commit014b7ecb6643332af35251c751aebd04bac4bb1e (patch)
treec28c04906cdd6a0dca95a704f446e72f868927da /libavcodec/ppc/mathops.h
parent24ac50525a219d5451f5cd712a4557dcca50198a (diff)
downloadffmpeg-014b7ecb6643332af35251c751aebd04bac4bb1e.tar.gz
PPC: 32-bit asm for MAC64 and MLS64
GCC makes a mess of these operations, so give it a hand. 55% faster MP3 decoding on G4. Originally committed as revision 18794 to svn://svn.ffmpeg.org/ffmpeg/trunk
Diffstat (limited to 'libavcodec/ppc/mathops.h')
-rw-r--r--libavcodec/ppc/mathops.h30
1 files changed, 30 insertions, 0 deletions
diff --git a/libavcodec/ppc/mathops.h b/libavcodec/ppc/mathops.h
index 2b5a5c4eb0..a74fcfa792 100644
--- a/libavcodec/ppc/mathops.h
+++ b/libavcodec/ppc/mathops.h
@@ -44,4 +44,34 @@ static inline av_const int MULH(int a, int b){
return r;
}
+#if !HAVE_PPC64
+static inline av_const int64_t MAC64(int64_t d, int a, int b)
+{
+ union { uint64_t x; unsigned hl[2]; } x = { d };
+ int h, l;
+ __asm__ ("mullw %3, %4, %5 \n\t"
+ "mulhw %2, %4, %5 \n\t"
+ "addc %1, %1, %3 \n\t"
+ "adde %0, %0, %2 \n\t"
+ : "+r"(x.hl[0]), "+r"(x.hl[1]), "=&r"(h), "=&r"(l)
+ : "r"(a), "r"(b));
+ return x.x;
+}
+#define MAC64(d, a, b) ((d) = MAC64(d, a, b))
+
+static inline av_const int64_t MLS64(int64_t d, int a, int b)
+{
+ union { uint64_t x; unsigned hl[2]; } x = { d };
+ int h, l;
+ __asm__ ("mullw %3, %4, %5 \n\t"
+ "mulhw %2, %4, %5 \n\t"
+ "subfc %1, %3, %1 \n\t"
+ "subfe %0, %2, %0 \n\t"
+ : "+r"(x.hl[0]), "+r"(x.hl[1]), "=&r"(h), "=&r"(l)
+ : "r"(a), "r"(b));
+ return x.x;
+}
+#define MLS64(d, a, b) ((d) = MLS64(d, a, b))
+#endif
+
#endif /* AVCODEC_PPC_MATHOPS_H */