1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
|
/**
* Copyright (C) 2025 Niklas Haas
*
* This file is part of FFmpeg.
*
* FFmpeg is free software; you can redistribute it and/or
* modify it under the terms of the GNU Lesser General Public
* License as published by the Free Software Foundation; either
* version 2.1 of the License, or (at your option) any later version.
*
* FFmpeg is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with FFmpeg; if not, write to the Free Software
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#include "ops_backend.h"
/*
 * When building with GCC 4.4 or newer, request the "finite-math-only"
 * optimization for the code that follows in this translation unit, which
 * includes the template files pulled in further down.
 * NOTE(review): presumably the floating-point kernels never have to deal with
 * NaN or infinite values -- confirm before relying on that.
 */
#if AV_GCC_VERSION_AT_LEAST(4, 4)
#pragma GCC optimize ("finite-math-only")
#endif
/* Array-based reference implementation */
/*
 * Number of elements held by one block. A definition of SWS_BLOCK_SIZE made
 * before this point takes precedence; otherwise it defaults to 32.
 */
#ifndef SWS_BLOCK_SIZE
# define SWS_BLOCK_SIZE 32
#endif
/*
 * Block types: fixed-size arrays of SWS_BLOCK_SIZE elements, one typedef for
 * each of uint8_t, uint16_t, uint32_t and float.
 */
typedef uint8_t u8block_t[SWS_BLOCK_SIZE];
typedef uint16_t u16block_t[SWS_BLOCK_SIZE];
typedef uint32_t u32block_t[SWS_BLOCK_SIZE];
typedef float f32block_t[SWS_BLOCK_SIZE];
/*
 * Template instantiation: ops_tmpl_int.c is included three times, with
 * BIT_DEPTH set to 8, 16 and 32 in turn, and ops_tmpl_float.c is included
 * once while BIT_DEPTH is 32. BIT_DEPTH is undefined again after each use.
 * NOTE(review): presumably these inclusions provide the op_table_int and
 * op_table_float tables referenced from compile() -- confirm in the template
 * sources.
 */
#define BIT_DEPTH 8
# include "ops_tmpl_int.c"
#undef BIT_DEPTH
#define BIT_DEPTH 16
# include "ops_tmpl_int.c"
#undef BIT_DEPTH
#define BIT_DEPTH 32
# include "ops_tmpl_int.c"
# include "ops_tmpl_float.c"
#undef BIT_DEPTH
static void process(const SwsOpExec *exec, const void *priv,
const int bx_start, const int y_start, int bx_end, int y_end)
{
const SwsOpChain *chain = priv;
const SwsOpImpl *impl = chain->impl;
SwsOpIter iter;
for (iter.y = y_start; iter.y < y_end; iter.y++) {
for (int i = 0; i < 4; i++) {
iter.in[i] = exec->in[i] + (iter.y - y_start) * exec->in_stride[i];
iter.out[i] = exec->out[i] + (iter.y - y_start) * exec->out_stride[i];
}
for (int block = bx_start; block < bx_end; block++) {
iter.x = block * SWS_BLOCK_SIZE;
((void (*)(SwsOpIter *, const SwsOpImpl *)) impl->cont)
(&iter, &impl[1]);
}
}
}
/**
 * Compile an operation list into a chain driven by process().
 *
 * A fresh chain is allocated and ff_sws_op_compile_tables() is called with
 * the u8, u16, u32 and f32 operation tables and a block size of
 * SWS_BLOCK_SIZE. The call is repeated for as long as it returns
 * AVERROR(EAGAIN).
 * NOTE(review): presumably EAGAIN means more passes over `ops` are required
 * -- confirm against ff_sws_op_compile_tables().
 *
 * @param ctx scaler context; not used by this function
 * @param ops operation list handed to ff_sws_op_compile_tables()
 * @param out on success, overwritten with the compiled operation: process()
 *            as the function, the chain as private data, and
 *            ff_sws_op_chain_free_cb as the free callback
 * @return 0 on success, AVERROR(ENOMEM) if the chain cannot be allocated, or
 *         the negative value returned by ff_sws_op_compile_tables(), in which
 *         case the chain is freed and *out is left untouched
 */
static int compile(SwsContext *ctx, SwsOpList *ops, SwsCompiledOp *out)
{
    static const SwsOpTable *const tables[] = {
        &bitfn(op_table_int, u8),
        &bitfn(op_table_int, u16),
        &bitfn(op_table_int, u32),
        &bitfn(op_table_float, f32),
    };

    SwsOpChain *chain = ff_sws_op_chain_alloc();
    int ret;

    if (!chain)
        return AVERROR(ENOMEM);

    /* Keep compiling until the helper reports something other than EAGAIN. */
    for (;;) {
        ret = ff_sws_op_compile_tables(tables, FF_ARRAY_ELEMS(tables), ops,
                                       SWS_BLOCK_SIZE, chain);
        if (ret != AVERROR(EAGAIN))
            break;
    }

    if (ret >= 0) {
        /* Success: the chain is stored in *out alongside its free callback. */
        *out = (SwsCompiledOp) {
            .func = process,
            .block_size = SWS_BLOCK_SIZE,
            .cpu_flags = chain->cpu_flags,
            .priv = chain,
            .free = ff_sws_op_chain_free_cb,
        };
        return 0;
    }

    /* Failure: nothing was handed out, so release the chain here. */
    ff_sws_op_chain_free(chain);
    return ret;
}
/* Backend descriptor named "c"; its compile callback is compile(). */
const SwsOpBackend backend_c = {
.name = "c",
.compile = compile,
};
|