about | summary | refs | log | tree | commit | diff | stats
path: root/libavfilter/x86
diff options
context:
space:
mode:
author: Ting Fu <ting.fu@intel.com>, 2019-09-18 15:05:35 +0800
committer: Ruiling Song <ruiling.song@intel.com>, 2019-09-26 08:12:36 +0800
commit: 4f589d668efdabc3764dcb0094929c2b4e01b35c (patch)
tree: d5496f42a88604d3cc0818194f4da9788bbe36b0 /libavfilter/x86
parent: 6aff2042d6483d6b9f07ef5165c8e31a871efee8 (diff)
download: ffmpeg-4f589d668efdabc3764dcb0094929c2b4e01b35c.tar.gz
avfilter/x86/vf_eq: add SSE2 version
Signed-off-by: Ting Fu <ting.fu@intel.com>
Diffstat (limited to 'libavfilter/x86')
-rw-r--r-- libavfilter/x86/vf_eq.asm | 12
-rw-r--r-- libavfilter/x86/vf_eq_init.c | 19
2 files changed, 29 insertions, 2 deletions
diff --git a/libavfilter/x86/vf_eq.asm b/libavfilter/x86/vf_eq.asm
index 8460342896..a30a287029 100644
--- a/libavfilter/x86/vf_eq.asm
+++ b/libavfilter/x86/vf_eq.asm
@@ -24,7 +24,7 @@
SECTION .text
-INIT_MMX mmxext
+%macro PROCESS_ONE_LINE 1
cglobal process_one_line, 5, 7, 5, src, dst, contrast, brightness, w
movd m3, contrastd
movd m4, brightnessd
@@ -39,7 +39,7 @@ cglobal process_one_line, 5, 7, 5, src, dst, contrast, brightness, w
pxor m1, m1
mov scalard, wd
and scalard, mmsize-1
- sar wd, 3
+ sar wd, %1
cmp wd, 1
jl .loop1
@@ -80,3 +80,11 @@ cglobal process_one_line, 5, 7, 5, src, dst, contrast, brightness, w
.end:
RET
+
+%endmacro
+
+INIT_MMX mmxext
+PROCESS_ONE_LINE 3
+
+INIT_XMM sse2
+PROCESS_ONE_LINE 4
diff --git a/libavfilter/x86/vf_eq_init.c b/libavfilter/x86/vf_eq_init.c
index 089961ffb2..52848d5996 100644
--- a/libavfilter/x86/vf_eq_init.c
+++ b/libavfilter/x86/vf_eq_init.c
@@ -28,6 +28,8 @@
extern void ff_process_one_line_mmxext(const uint8_t *src, uint8_t *dst, short contrast,
short brightness, int w);
+extern void ff_process_one_line_sse2(const uint8_t *src, uint8_t *dst, short contrast,
+ short brightness, int w);
static void process_mmxext(EQParameters *param, uint8_t *dst, int dst_stride,
const uint8_t *src, int src_stride, int w, int h)
@@ -44,6 +46,20 @@ static void process_mmxext(EQParameters *param, uint8_t *dst, int dst_stride,
emms_c();
}
+static void process_sse2(EQParameters *param, uint8_t *dst, int dst_stride,
+ const uint8_t *src, int src_stride, int w, int h)
+{ /* Run ff_process_one_line_sse2() over h rows of w samples each, reading
+   * from src and writing to dst, with the contrast/brightness arguments
+   * derived once from *param.
+   *
+   * param      - supplies the floating-point contrast and brightness values
+   * dst        - start of the first output row
+   * dst_stride - added to dst after every row
+   * src        - start of the first input row
+   * src_stride - added to src after every row
+   * w          - passed unchanged to the per-row routine as its width
+   * h          - number of rows to process
+   *
+   * NOTE(review): unlike process_mmxext there is no emms_c() after the
+   * loop - presumably unnecessary because the SSE2 build of the routine
+   * does not touch MMX registers; confirm against vf_eq.asm.
+   */
+ short contrast = (short) (param->contrast * 256 * 16); /* scale by 256*16, then truncate to short */
+ short brightness = ((short) (100.0 * param->brightness + 100.0) * 511)
+ / 200 - 128 - contrast / 32; /* the (short) cast covers only the parenthesised sum; the *511, /200 and subtractions run in int and are narrowed to short on assignment */
+
+ while (h--) { /* one iteration per row; h doubles as the countdown */
+ ff_process_one_line_sse2(src, dst, contrast, brightness, w); /* same contrast/brightness for every row */
+ src += src_stride;
+ dst += dst_stride;
+ }
+}
+
av_cold void ff_eq_init_x86(EQContext *eq)
{
int cpu_flags = av_get_cpu_flags();
@@ -51,4 +67,7 @@ av_cold void ff_eq_init_x86(EQContext *eq)
if (cpu_flags & AV_CPU_FLAG_MMXEXT) {
eq->process = process_mmxext;
}
+ if (cpu_flags & AV_CPU_FLAG_SSE2) {
+ eq->process = process_sse2;
+ }
}