/*
 * Bit masks for packed 32-bit pixels holding one byte per colour channel in
 * the low 24 bits. None of the masks covers the top byte.
 */
/* All three colour bytes with their lowest bit cleared, so each byte can be
 * shifted right by one without leaking a bit into the byte below it. */
#define LB_MASK       ((0xFE << 16) | (0xFE << 8) | 0xFE)
/* Bits 16-23 and bits 0-7: the two outer colour bytes. */
#define RED_BLUE_MASK ((0xFF << 16) | 0xFF)
/* Bits 8-15: the middle colour byte. */
#define GREEN_MASK    (0xFF << 8)
/* Byte offset of member `x` inside the filter's private XBRContext struct. */
#define OFFSET(x) offsetof(XBRContext, x)
/*
 * Combined option flags (filtering parameter | video parameter).
 * The replacement list is parenthesized so the OR stays a single operand
 * wherever the macro is expanded: without the parentheses `FLAGS & x` would
 * parse as `A | (B & x)`.
 */
#define FLAGS (AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_VIDEO_PARAM)
/*
 * Difference metric between two packed pixels, computed from their entries
 * in the r2y lookup table.
 *
 * x, y: the two pixel values to compare.
 * r2y:  lookup table indexed by the low 24 bits of a pixel.
 *
 * NOTE(review): only the two table lookups are visible in this excerpt; how
 * the Y/U/V fields are combined into the return value is not shown here.
 */
66 static uint32_t
pixel_diff(uint32_t x, uint32_t y,
const uint32_t *r2y)
/* Field masks for a table entry: bits 16-23, bits 8-15 and bits 0-7. */
68 #define YMASK 0xff0000
69 #define UMASK 0x00ff00
70 #define VMASK 0x0000ff
/* Absolute difference; both operands are converted to int before subtracting
 * so an unsigned subtraction cannot wrap around. */
71 #define ABSDIFF(a,b) (abs((int)(a)-(int)(b)))
/* Only the low 24 bits of each pixel select the table entry; the top byte
 * of the pixel is ignored. */
73 uint32_t yuv1 = r2y[x & 0xffffff];
74 uint32_t yuv2 = r2y[y & 0xffffff];
/*
 * Packed-pixel blends. ALPHA_BLEND_<w>_W(a, b) moves `a` towards `b` by
 * w/256 (32 -> 1/8, 64 -> 1/4, 128 -> 1/2, 192 -> 3/4, 224 -> 7/8).
 * The masks drop the top byte, so the result always has it cleared.
 * Arguments are evaluated more than once: pass side-effect-free expressions.
 */

/* Half-and-half mix: clear the low bit of every colour byte, halve both
 * operands and add them. */
#define ALPHA_BLEND_128_W(a, b) \
    ((((a) & LB_MASK) >> 1) + (((b) & LB_MASK) >> 1))

/* Blend the channels selected by `mask`: a + (((b - a) * m) >> s), with the
 * result confined to `mask` again. */
#define ALPHA_BLEND_CHANNEL(a, b, m, s, mask) \
    ((mask) & (((a) & (mask)) + (((((b) & (mask)) - ((a) & (mask))) * (m)) >> (s))))

/* Weighted blend with weight m / 2^s: the two outer bytes are processed
 * together in one pass, the middle byte in a second pass. */
#define ALPHA_BLEND_BASE(a, b, m, s) \
    ( ALPHA_BLEND_CHANNEL(a, b, m, s, RED_BLUE_MASK) \
    | ALPHA_BLEND_CHANNEL(a, b, m, s, GREEN_MASK))

#define ALPHA_BLEND_32_W(a, b)  ALPHA_BLEND_BASE(a, b, 1, 3) /* 1/8 of b */
#define ALPHA_BLEND_64_W(a, b)  ALPHA_BLEND_BASE(a, b, 1, 2) /* 1/4 of b */
#define ALPHA_BLEND_192_W(a, b) ALPHA_BLEND_BASE(a, b, 3, 2) /* 3/4 of b */
#define ALPHA_BLEND_224_W(a, b) ALPHA_BLEND_BASE(a, b, 7, 3) /* 7/8 of b */
/* Distance between two pixels; relies on a variable named `r2y` being in
 * scope wherever the macro is expanded. */
#define df(p, q) pixel_diff(p, q, r2y)
/* Two pixels count as "equal" when their distance is below 155. */
#define eq(p, q) (pixel_diff(p, q, r2y) < 155)
/*
 * FILT2: one corner pass of the 2x scaler.
 *
 * PE..A1 are pixel values from the neighbourhood of the source pixel PE;
 * N0..N3 are indices into the output array E. The macro expects `E` and
 * `r2y` (used by df()/eq()) to be in scope at the expansion site.
 *
 * Visible behaviour:
 *  - nothing happens unless PE differs from both PH and PF;
 *  - e and i are sums of df() over pixel pairs, with the PH/PF term (in e)
 *    and the PE/PI term (in i) weighted by 4;
 *  - px is PF when df(PE,PF) <= df(PE,PH), otherwise PH;
 *  - when e < i and the eq()-based condition holds (note && binds tighter
 *    than ||), ke/ki and the `left`/`up` flags are computed and px is
 *    blended into E[N1..N3] with the ALPHA_BLEND_*_W macros.
 *
 * NOTE(review): the if/else structure selecting between the blend
 * statements, and the closing of the do-block, are not visible in this
 * excerpt.
 */
92 #define FILT2(PE, PI, PH, PF, PG, PC, PD, PB, PA, G5, C4, G0, D0, C1, B1, F4, I4, H5, I5, A0, A1, \
93 N0, N1, N2, N3) do { \
94 if (PE != PH && PE != PF) { \
95 const unsigned e = df(PE,PC) + df(PE,PG) + df(PI,H5) + df(PI,F4) + (df(PH,PF)<<2); \
96 const unsigned i = df(PH,PD) + df(PH,I5) + df(PF,I4) + df(PF,PB) + (df(PE,PI)<<2); \
98 const unsigned px = df(PE,PF) <= df(PE,PH) ? PF : PH; \
99 if (e < i && (!eq(PF,PB) && !eq(PH,PD) || eq(PE,PI) \
100 && (!eq(PF,I4) && !eq(PH,I5)) \
101 || eq(PE,PG) || eq(PE,PC))) { \
102 const unsigned ke = df(PF,PG); \
103 const unsigned ki = df(PH,PC); \
104 const int left = ke<<1 <= ki && PE != PG && PD != PG; \
105 const int up = ke >= ki<<1 && PE != PC && PB != PC; \
107 E[N3] = ALPHA_BLEND_224_W(E[N3], px); \
108 E[N2] = ALPHA_BLEND_64_W( E[N2], px); \
111 E[N3] = ALPHA_BLEND_192_W(E[N3], px); \
112 E[N2] = ALPHA_BLEND_64_W( E[N2], px); \
114 E[N3] = ALPHA_BLEND_192_W(E[N3], px); \
115 E[N1] = ALPHA_BLEND_64_W( E[N1], px); \
117 E[N3] = ALPHA_BLEND_128_W(E[N3], px); \
120 E[N3] = ALPHA_BLEND_128_W(E[N3], px); \
/*
 * FILT3: one corner pass of the 3x scaler.
 *
 * PE..A1 are pixel values from the neighbourhood of the source pixel PE;
 * N0..N8 are indices into the output array E. The macro expects `E` and
 * `r2y` (used by df()/eq()) to be in scope at the expansion site.
 *
 * Visible behaviour:
 *  - nothing happens unless PE differs from both PH and PF;
 *  - e and i are sums of df() over pixel pairs, with the PH/PF term (in e)
 *    and the PE/PI term (in i) weighted by 4;
 *  - px is PF when df(PE,PF) <= df(PE,PH), otherwise PH;
 *  - the eq()-based condition tests more neighbour pairs than the FILT2
 *    one (PF/PC, PH/PG, PF/F4, PH/H5 in addition); && binds tighter than ||;
 *  - when the condition holds, ke/ki and the `left`/`up` flags are computed
 *    and px is blended into E[N2], E[N5..N8] with the ALPHA_BLEND_*_W macros.
 *
 * NOTE(review): the if/else structure selecting between the blend
 * statements, and the closing of the do-block, are not visible in this
 * excerpt.
 */
126 #define FILT3(PE, PI, PH, PF, PG, PC, PD, PB, PA, G5, C4, G0, D0, C1, B1, F4, I4, H5, I5, A0, A1, \
127 N0, N1, N2, N3, N4, N5, N6, N7, N8) do { \
128 if (PE != PH && PE != PF) { \
129 const unsigned e = df(PE,PC) + df(PE,PG) + df(PI,H5) + df(PI,F4) + (df(PH,PF)<<2); \
130 const unsigned i = df(PH,PD) + df(PH,I5) + df(PF,I4) + df(PF,PB) + (df(PE,PI)<<2); \
132 const unsigned px = df(PE,PF) <= df(PE,PH) ? PF : PH; \
133 if (e < i && (!eq(PF,PB) && !eq(PF,PC) || !eq(PH,PD) && !eq(PH,PG) || eq(PE,PI) \
134 && (!eq(PF,F4) && !eq(PF,I4) || !eq(PH,H5) && !eq(PH,I5)) \
135 || eq(PE,PG) || eq(PE,PC))) { \
136 const unsigned ke = df(PF,PG); \
137 const unsigned ki = df(PH,PC); \
138 const int left = ke<<1 <= ki && PE != PG && PD != PG; \
139 const int up = ke >= ki<<1 && PE != PC && PB != PC; \
141 E[N7] = ALPHA_BLEND_192_W(E[N7], px); \
142 E[N6] = ALPHA_BLEND_64_W( E[N6], px); \
147 E[N7] = ALPHA_BLEND_192_W(E[N7], px); \
148 E[N5] = ALPHA_BLEND_64_W( E[N5], px); \
149 E[N6] = ALPHA_BLEND_64_W( E[N6], px); \
152 E[N5] = ALPHA_BLEND_192_W(E[N5], px); \
153 E[N7] = ALPHA_BLEND_64_W( E[N7], px); \
154 E[N2] = ALPHA_BLEND_64_W( E[N2], px); \
157 E[N8] = ALPHA_BLEND_224_W(E[N8], px); \
158 E[N5] = ALPHA_BLEND_32_W( E[N5], px); \
159 E[N7] = ALPHA_BLEND_32_W( E[N7], px); \
162 E[N8] = ALPHA_BLEND_128_W(E[N8], px); \
/*
 * FILT4: one corner pass of the 4x scaler.
 *
 * PE..A1 are pixel values from the neighbourhood of the source pixel PE.
 * The sixteen index parameters are declared in the order
 * N15, N14, N11, N3, N7, N10, N13, N12, N9, N6, N2, N1, N5, N8, N4, N0
 * (not ascending), so call sites must follow that order. The macro expects
 * `E` and `r2y` (used by df()/eq()) to be in scope at the expansion site.
 *
 * Visible behaviour:
 *  - nothing happens unless PE differs from both PH and PF;
 *  - e, i, px and the eq()-based condition are computed exactly as written
 *    in FILT2 (&& binds tighter than ||);
 *  - when the condition holds, ke/ki and the `left`/`up` flags are computed;
 *    E[N15], E[N14], E[N11] may be overwritten with px outright, E[N10] and
 *    E[N3] may copy the freshly blended E[N12], and the remaining writes
 *    blend px in with the ALPHA_BLEND_*_W macros.
 *
 * NOTE(review): the if/else structure selecting between the statement
 * groups, and the closing of the do-block, are not visible in this excerpt.
 */
168 #define FILT4(PE, PI, PH, PF, PG, PC, PD, PB, PA, G5, C4, G0, D0, C1, B1, F4, I4, H5, I5, A0, A1, \
169 N15, N14, N11, N3, N7, N10, N13, N12, N9, N6, N2, N1, N5, N8, N4, N0) do { \
170 if (PE != PH && PE != PF) { \
171 const unsigned e = df(PE,PC) + df(PE,PG) + df(PI,H5) + df(PI,F4) + (df(PH,PF)<<2); \
172 const unsigned i = df(PH,PD) + df(PH,I5) + df(PF,I4) + df(PF,PB) + (df(PE,PI)<<2); \
174 const unsigned px = df(PE,PF) <= df(PE,PH) ? PF : PH; \
175 if (e < i && (!eq(PF,PB) && !eq(PH,PD) || eq(PE,PI) \
176 && (!eq(PF,I4) && !eq(PH,I5)) \
177 || eq(PE,PG) || eq(PE,PC))) { \
178 const unsigned ke = df(PF,PG); \
179 const unsigned ki = df(PH,PC); \
180 const int left = ke<<1 <= ki && PE != PG && PD != PG; \
181 const int up = ke >= ki<<1 && PE != PC && PB != PC; \
183 E[N13] = ALPHA_BLEND_192_W(E[N13], px); \
184 E[N12] = ALPHA_BLEND_64_W( E[N12], px); \
185 E[N15] = E[N14] = E[N11] = px; \
186 E[N10] = E[N3] = E[N12]; \
189 E[N11] = ALPHA_BLEND_192_W(E[N11], px); \
190 E[N13] = ALPHA_BLEND_192_W(E[N13], px); \
191 E[N10] = ALPHA_BLEND_64_W( E[N10], px); \
192 E[N12] = ALPHA_BLEND_64_W( E[N12], px); \
196 E[N14] = ALPHA_BLEND_192_W(E[N14], px); \
197 E[N7 ] = ALPHA_BLEND_192_W(E[N7 ], px); \
198 E[N10] = ALPHA_BLEND_64_W( E[N10], px); \
199 E[N3 ] = ALPHA_BLEND_64_W( E[N3 ], px); \
203 E[N11] = ALPHA_BLEND_128_W(E[N11], px); \
204 E[N14] = ALPHA_BLEND_128_W(E[N14], px); \
208 E[N15] = ALPHA_BLEND_128_W(E[N15], px); \
/*
 * Interior of the per-slice scaling routine (called as xbr_filter(arg,
 * jobnr, nb_jobs, size) elsewhere in the file).
 *
 * NOTE(review): the function signature, the declarations of td/input/output,
 * n, x, y and slice_end, the top/bottom edge adjustments, the dispatch on
 * the scale factor and the per-column pointer advance are not visible in
 * this excerpt; comments below describe only what the visible lines do.
 */
/* Lookup table used by df()/eq() inside the FILT* macros. */
219 const uint32_t *r2y =
td->rgbtoyuv;
/* First input row of this job: the frame height is divided evenly across
 * nb_jobs. */
220 const int slice_start = (
input->height * jobnr ) / nb_jobs;
/* Output stride measured in 32-bit pixels, plus 2x and 3x that stride, for
 * addressing rows 1..3 of the upscaled block. */
222 const int nl =
output->linesize[0] >> 2;
223 const int nl1 = nl + nl;
224 const int nl2 = nl1 + nl;
226 for (y = slice_start; y <
slice_end; y++) {
/* E points at output row y * n, i.e. the top of the block produced from
 * input row y (n is presumably the scale factor -- confirm). */
228 uint32_t *
E = (uint32_t *)(
output->data[0] + y *
output->linesize[0] * n);
/* sa0..sa4 address input rows y-2..y+2. sa2 starts 8 bytes (two 32-bit
 * pixels) before the start of row y, so index 2 is the first pixel of
 * the row here. */
229 const uint32_t *sa2 = (uint32_t *)(
input->data[0] + y *
input->linesize[0] - 8);
230 const uint32_t *sa1 = sa2 - (
input->linesize[0]>>2);
231 const uint32_t *sa0 = sa1 - (
input->linesize[0]>>2);
232 const uint32_t *sa3 = sa2 + (
input->linesize[0]>>2);
233 const uint32_t *sa4 = sa3 + (
input->linesize[0]>>2);
/* Special handling for the last two rows, and again for the very last row;
 * the adjustments themselves are not visible in this excerpt. */
242 if (y >=
input->height - 2) {
244 if (y ==
input->height - 1) {
249 for (x = 0; x <
input->width; x++) {
/* Centre column (index 2) of the five rows; PE is the source pixel. */
250 const uint32_t
B1 = sa0[2];
251 const uint32_t PB = sa1[2];
252 const uint32_t PE = sa2[2];
253 const uint32_t PH = sa3[2];
254 const uint32_t H5 = sa4[2];
/* Column to the left: index 1, or the centre column again when x == 0. */
256 const int pprev = 2 - (x > 0);
257 const uint32_t
A1 = sa0[pprev];
258 const uint32_t PA = sa1[pprev];
259 const uint32_t
PD = sa2[pprev];
260 const uint32_t PG = sa3[pprev];
261 const uint32_t G5 = sa4[pprev];
/* Two columns to the left: steps one further back only when x > 1. */
263 const int pprev2 = pprev - (x > 1);
264 const uint32_t A0 = sa1[pprev2];
265 const uint32_t D0 = sa2[pprev2];
266 const uint32_t G0 = sa3[pprev2];
/* Column to the right: index 3, or the centre column at the last column. */
268 const int pnext = 3 - (x ==
input->width - 1);
269 const uint32_t
C1 = sa0[pnext];
270 const uint32_t PC = sa1[pnext];
271 const uint32_t
PF = sa2[pnext];
272 const uint32_t PI = sa3[pnext];
273 const uint32_t I5 = sa4[pnext];
/* Two columns to the right: steps one further only when at least two
 * columns remain to the right of x. */
275 const int pnext2 = pnext + 1 - (x >=
input->width - 2);
276 const uint32_t
C4 = sa1[pnext2];
277 const uint32_t F4 = sa2[pnext2];
278 const uint32_t I4 = sa3[pnext2];
/* 2x path: output pixels are seeded with PE, then FILT2 runs four times
 * with the same 21 neighbours passed in a different order each time and the
 * output indices permuted to match. (The start of the seeding statement and
 * the enclosing condition are not visible here.) */
282 E[nl] =
E[nl + 1] = PE;
284 FILT2(PE, PI, PH,
PF, PG, PC,
PD, PB, PA, G5,
C4, G0, D0,
C1,
B1, F4, I4, H5, I5, A0,
A1, 0, 1, nl, nl+1);
285 FILT2(PE, PC,
PF, PB, PI, PA, PH,
PD, PG, I4,
A1, I5, H5, A0, D0,
B1,
C1, F4,
C4, G5, G0, nl, 0, nl+1, 1);
286 FILT2(PE, PA, PB,
PD, PC, PG,
PF, PH, PI,
C1, G0,
C4, F4, G5, H5, D0, A0,
B1,
A1, I4, I5, nl+1, nl, 1, 0);
287 FILT2(PE, PG,
PD, PH, PA, PI, PB,
PF, PC, A0, I5,
A1,
B1, I4, F4, H5, G5, D0, G0,
C1,
C4, 1, nl+1, 0, nl);
/* 3x path: same scheme with FILT3 and nine output indices per call. (The
 * start of the seeding statement is not visible here.) */
290 E[nl] =
E[nl+1] =
E[nl+2] =
291 E[nl1] =
E[nl1+1] =
E[nl1+2] = PE;
293 FILT3(PE, PI, PH,
PF, PG, PC,
PD, PB, PA, G5,
C4, G0, D0,
C1,
B1, F4, I4, H5, I5, A0,
A1, 0, 1, 2, nl, nl+1, nl+2, nl1, nl1+1, nl1+2);
294 FILT3(PE, PC,
PF, PB, PI, PA, PH,
PD, PG, I4,
A1, I5, H5, A0, D0,
B1,
C1, F4,
C4, G5, G0, nl1, nl, 0, nl1+1, nl+1, 1, nl1+2, nl+2, 2);
295 FILT3(PE, PA, PB,
PD, PC, PG,
PF, PH, PI,
C1, G0,
C4, F4, G5, H5, D0, A0,
B1,
A1, I4, I5, nl1+2, nl1+1, nl1, nl+2, nl+1, nl, 2, 1, 0);
296 FILT3(PE, PG,
PD, PH, PA, PI, PB,
PF, PC, A0, I5,
A1,
B1, I4, F4, H5, G5, D0, G0,
C1,
C4, 2, nl+2, nl1+2, 1, nl+1, nl1+1, 0, nl, nl1);
/* 4x path: all sixteen pixels of the 4x4 output block are seeded with PE,
 * then FILT4 runs four times with sixteen output indices per call. */
298 E[0] =
E[1] =
E[2] =
E[3] =
299 E[nl] =
E[nl+1] =
E[nl+2] =
E[nl+3] =
300 E[nl1] =
E[nl1+1] =
E[nl1+2] =
E[nl1+3] =
301 E[nl2] =
E[nl2+1] =
E[nl2+2] =
E[nl2+3] = PE;
303 FILT4(PE, PI, PH,
PF, PG, PC,
PD, PB, PA, G5,
C4, G0, D0,
C1,
B1, F4, I4, H5, I5, A0,
A1, nl2+3, nl2+2, nl1+3, 3, nl+3, nl1+2, nl2+1, nl2, nl1+1, nl+2, 2, 1, nl+1, nl1, nl, 0);
304 FILT4(PE, PC,
PF, PB, PI, PA, PH,
PD, PG, I4,
A1, I5, H5, A0, D0,
B1,
C1, F4,
C4, G5, G0, 3, nl+3, 2, 0, 1, nl+2, nl1+3, nl2+3, nl1+2, nl+1, nl, nl1, nl1+1, nl2+2, nl2+1, nl2);
305 FILT4(PE, PA, PB,
PD, PC, PG,
PF, PH, PI,
C1, G0,
C4, F4, G5, H5, D0, A0,
B1,
A1, I4, I5, 0, 1, nl, nl2, nl1, nl+1, 2, 3, nl+2, nl1+1, nl2+1, nl2+2, nl1+2, nl+3, nl1+3, nl2+3);
306 FILT4(PE, PG,
PD, PH, PA, PI, PB,
PF, PC, A0, I5,
A1,
B1, I4, F4, H5, G5, D0, G0,
C1,
C4, nl2, nl1, nl2+1, nl2+3, nl2+2, nl1+1, nl, 0, nl+1, nl1+2, nl1+3, nl+3, nl+2, 1, 2, 3);
/*
 * XBR_FUNC(size): defines a static function named xbr<size>x taking
 * (ctx, arg, jobnr, nb_jobs) that forwards arg, jobnr and nb_jobs to
 * xbr_filter() with `size` as the fourth argument.
 *
 * NOTE(review): the braces and return statement of the generated function
 * are not visible in this excerpt.
 */
320 #define XBR_FUNC(size) \
321 static int xbr##size##x(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs) \
323 xbr_filter(arg, jobnr, nb_jobs, size); \
/* Pass the context's lookup table along in the thread-data struct (the
 * scaling code reads it back as td->rgbtoyuv). */
360 td.rgbtoyuv =
s->rgbtoyuv;
/* The output frame takes its dimensions from the output link. */
364 out->width = outlink->
w;
365 out->height = outlink->
h;
/* Scaler entry points in order of scale factor; indexed below with
 * s->n - 2, so entry 0 is used when s->n == 2. */
374 static const xbrfunc_t xbrfuncs[] = {xbr2x, xbr3x, xbr4x};
/*
 * Fill s->rgbtoyuv. The table index c packs (rg + g) into bits 16-23, g into
 * bits 8-15 and (bg + g) into bits 0-7, so rg and bg are the offsets of the
 * two outer channels from the middle one. Iterating over (bg, rg) first lets
 * u and v, which do not depend on g, be computed once per pair.
 */
379 for (bg = -255; bg < 256; bg++) {
380 for (rg = -255; rg < 256; rg++) {
/* The integer division may produce a negative value; after the cast the
 * + 128 wraps it back into range in unsigned arithmetic. */
381 const uint32_t
u = (uint32_t)((-169*rg + 500*bg)/1000) + 128;
382 const uint32_t v = (uint32_t)(( 500*rg - 81*bg)/1000) + 128;
/* Range of g for which both (rg + g) and (bg + g) stay within 0..255. */
383 int startg =
FFMAX3(-bg, -rg, 0);
384 int endg =
FFMIN3(255-bg, 255-rg, 255);
/* y and the table index for g == startg; y is then bumped by one per
 * g step in the loop below. */
385 uint32_t y = (uint32_t)(( 299*rg + 1000*startg + 114*bg)/1000);
386 c = bg + rg * (1 << 16) + 0x010101 * startg;
387 for (
g = startg;
g <= endg;
g++) {
/* Entry layout: y in bits 16 and up, u in bits 8-15, v in bits 0-7.
 * NOTE(review): the update of c between iterations is not visible in this
 * excerpt. */
388 s->rgbtoyuv[
c] = ((y++) << 16) + (
u << 8) + v;
/* Select the scaler matching the configured factor s->n. */
394 s->func = xbrfuncs[
s->n - 2];
421 .priv_class = &xbr_class,