aboutsummaryrefslogtreecommitdiffstats
path: root/libavcodec/x86/h26x/h2656dsp.h
blob: 0ea08b6a20a162ae45c6639844da4d267b1610d3 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
/*
 * DSP for HEVC/VVC
 *
 * Copyright (C) 2022-2024 Nuo Mi
 * Copyright (c) 2023-2024 Wu Jianhua
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#ifndef AVCODEC_X86_H26X_H2656DSP_H
#define AVCODEC_X86_H26X_H2656DSP_H

#include "config.h"
#include "libavutil/x86/asm.h"
#include "libavutil/x86/cpu.h"
#include <stdlib.h>

#define H2656_PEL_PROTOTYPE(name, D, opt) \
void ff_h2656_put_ ## name ## _ ## D ## _##opt(int16_t *dst, ptrdiff_t dststride, const uint8_t *_src, ptrdiff_t _srcstride, int height, const int8_t *hf, const int8_t *vf, int width);          \
void ff_h2656_put_uni_ ## name ## _ ## D ## _##opt(uint8_t *_dst, ptrdiff_t _dststride, const uint8_t *_src, ptrdiff_t _srcstride, int height, const int8_t *hf, const int8_t *vf, int width)     \

#define H2656_MC_8TAP_PROTOTYPES(fname, bitd, opt)    \
    H2656_PEL_PROTOTYPE(fname##4,  bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##6,  bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##8,  bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##12,  bitd, opt);       \
    H2656_PEL_PROTOTYPE(fname##16, bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##32, bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##64, bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##128, bitd, opt)

H2656_MC_8TAP_PROTOTYPES(pixels  ,  8, sse4);
H2656_MC_8TAP_PROTOTYPES(pixels  , 10, sse4);
H2656_MC_8TAP_PROTOTYPES(pixels  , 12, sse4);
H2656_MC_8TAP_PROTOTYPES(8tap_h  ,  8, sse4);
H2656_MC_8TAP_PROTOTYPES(8tap_h  , 10, sse4);
H2656_MC_8TAP_PROTOTYPES(8tap_h  , 12, sse4);
H2656_MC_8TAP_PROTOTYPES(8tap_v  ,  8, sse4);
H2656_MC_8TAP_PROTOTYPES(8tap_v  , 10, sse4);
H2656_MC_8TAP_PROTOTYPES(8tap_v  , 12, sse4);
H2656_MC_8TAP_PROTOTYPES(8tap_hv ,  8, sse4);
H2656_MC_8TAP_PROTOTYPES(8tap_hv , 10, sse4);
H2656_MC_8TAP_PROTOTYPES(8tap_hv , 12, sse4);

#define H2656_MC_4TAP_PROTOTYPES(fname, bitd, opt)    \
    H2656_PEL_PROTOTYPE(fname##2,  bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##4,  bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##6,  bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##8,  bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##12, bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##16, bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##32, bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##64, bitd, opt);        \
    H2656_PEL_PROTOTYPE(fname##128, bitd, opt)

#define H2656_MC_4TAP_PROTOTYPES_SSE4(bitd)           \
    H2656_PEL_PROTOTYPE(pixels2, bitd, sse4);         \
    H2656_MC_4TAP_PROTOTYPES(4tap_h, bitd, sse4);     \
    H2656_MC_4TAP_PROTOTYPES(4tap_v, bitd, sse4);     \
    H2656_MC_4TAP_PROTOTYPES(4tap_hv, bitd, sse4);    \

H2656_MC_4TAP_PROTOTYPES_SSE4(8)
H2656_MC_4TAP_PROTOTYPES_SSE4(10)
H2656_MC_4TAP_PROTOTYPES_SSE4(12)

#define H2656_MC_8TAP_PROTOTYPES_AVX2(fname)              \
    H2656_PEL_PROTOTYPE(fname##32 , 8, avx2);             \
    H2656_PEL_PROTOTYPE(fname##64 , 8, avx2);             \
    H2656_PEL_PROTOTYPE(fname##128, 8, avx2);             \
    H2656_PEL_PROTOTYPE(fname##16 ,10, avx2);             \
    H2656_PEL_PROTOTYPE(fname##32 ,10, avx2);             \
    H2656_PEL_PROTOTYPE(fname##64 ,10, avx2);             \
    H2656_PEL_PROTOTYPE(fname##128,10, avx2);             \
    H2656_PEL_PROTOTYPE(fname##16 ,12, avx2);             \
    H2656_PEL_PROTOTYPE(fname##32 ,12, avx2);             \
    H2656_PEL_PROTOTYPE(fname##64 ,12, avx2);             \
    H2656_PEL_PROTOTYPE(fname##128,12, avx2)              \

H2656_MC_8TAP_PROTOTYPES_AVX2(pixels);
H2656_MC_8TAP_PROTOTYPES_AVX2(8tap_h);
H2656_MC_8TAP_PROTOTYPES_AVX2(8tap_v);
H2656_MC_8TAP_PROTOTYPES_AVX2(8tap_hv);
H2656_PEL_PROTOTYPE(8tap_hv16, 8, avx2);

H2656_MC_8TAP_PROTOTYPES_AVX2(4tap_h);
H2656_MC_8TAP_PROTOTYPES_AVX2(4tap_v);
H2656_MC_8TAP_PROTOTYPES_AVX2(4tap_hv);

#endif