FFmpeg
ops_optimizer.c
Go to the documentation of this file.
1 /**
2  * Copyright (C) 2025 Niklas Haas
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 #include "libavutil/avassert.h"
22 #include "libavutil/bswap.h"
23 #include "libavutil/rational.h"
24 
25 #include "ops.h"
26 #include "ops_internal.h"
27 
28 #define RET(x) \
29  do { \
30  if ((ret = (x)) < 0) \
31  return ret; \
32  } while (0)
33 
34 /**
35  * Try to commute a clear op with the next operation. Makes any adjustments
36  * to the operations as needed, but does not perform the actual commutation.
37  *
38  * Returns whether successful.
39  */
40 static bool op_commute_clear(SwsOp *op, SwsOp *next)
41 {
42  SwsOp tmp;
43 
44  av_assert1(op->op == SWS_OP_CLEAR);
45  switch (next->op) {
46  case SWS_OP_CONVERT:
47  op->type = next->convert.to;
48  /* fall through */
49  case SWS_OP_LSHIFT:
50  case SWS_OP_RSHIFT:
51  case SWS_OP_DITHER:
52  case SWS_OP_MIN:
53  case SWS_OP_MAX:
54  case SWS_OP_SCALE:
55  case SWS_OP_READ:
56  case SWS_OP_SWIZZLE:
57  case SWS_OP_FILTER_H:
58  case SWS_OP_FILTER_V:
59  ff_sws_apply_op_q(next, op->c.q4);
60  return true;
61  case SWS_OP_SWAP_BYTES:
62  switch (next->type) {
63  case SWS_PIXEL_U16:
64  ff_sws_apply_op_q(next, op->c.q4); /* always works */
65  return true;
66  case SWS_PIXEL_U32:
67  for (int i = 0; i < 4; i++) {
68  uint32_t v = av_bswap32(op->c.q4[i].num);
69  if (v > INT_MAX)
70  return false; /* can't represent as AVRational anymore */
71  tmp.c.q4[i] = Q(v);
72  }
73  op->c = tmp.c;
74  return true;
75  default:
76  return false;
77  }
78  case SWS_OP_INVALID:
79  case SWS_OP_WRITE:
80  case SWS_OP_LINEAR:
81  case SWS_OP_PACK:
82  case SWS_OP_UNPACK:
83  case SWS_OP_CLEAR:
84  return false;
85  case SWS_OP_TYPE_NB:
86  break;
87  }
88 
89  av_unreachable("Invalid operation type!");
90  return false;
91 }
92 
93  /**
94  * Try to commute a swizzle op with the next operation. Makes any adjustments
95  * to the operations as needed, but does not perform the actual commutation.
96  *
97  * Returns whether successful.
98  */
99 static bool op_commute_swizzle(SwsOp *op, SwsOp *next)
100 {
101  bool seen[4] = {0};
102 
103  av_assert1(op->op == SWS_OP_SWIZZLE);
104  switch (next->op) {
105  case SWS_OP_CONVERT:
106  op->type = next->convert.to;
107  /* fall through */
108  case SWS_OP_SWAP_BYTES:
109  case SWS_OP_LSHIFT:
110  case SWS_OP_RSHIFT:
111  case SWS_OP_SCALE:
112  case SWS_OP_FILTER_H:
113  case SWS_OP_FILTER_V:
114  return true;
115 
116  /**
117  * We can commute per-channel ops only if the per-channel constants are the
118  * same for all duplicated channels; e.g.:
119  * SWIZZLE {0, 0, 0, 3}
120  * NEXT {x, x, x, w}
121  * ->
122  * NEXT {x, _, _, w}
123  * SWIZZLE {0, 0, 0, 3}
124  */
125  case SWS_OP_MIN:
126  case SWS_OP_MAX: {
127  const SwsConst c = next->c;
128  for (int i = 0; i < 4; i++) {
129  if (!SWS_OP_NEEDED(op, i))
130  continue;
131  const int j = op->swizzle.in[i];
132  if (seen[j] && av_cmp_q(next->c.q4[j], c.q4[i]))
133  return false;
134  next->c.q4[j] = c.q4[i];
135  seen[j] = true;
136  }
137  return true;
138  }
139 
140  case SWS_OP_DITHER: {
141  const SwsDitherOp d = next->dither;
142  for (int i = 0; i < 4; i++) {
143  if (!SWS_OP_NEEDED(op, i))
144  continue;
145  const int j = op->swizzle.in[i];
146  if (seen[j] && next->dither.y_offset[j] != d.y_offset[i])
147  return false;
148  next->dither.y_offset[j] = d.y_offset[i];
149  seen[j] = true;
150  }
151  return true;
152  }
153 
154  case SWS_OP_INVALID:
155  case SWS_OP_READ:
156  case SWS_OP_WRITE:
157  case SWS_OP_SWIZZLE:
158  case SWS_OP_CLEAR:
159  case SWS_OP_LINEAR:
160  case SWS_OP_PACK:
161  case SWS_OP_UNPACK:
162  return false;
163  case SWS_OP_TYPE_NB:
164  break;
165  }
166 
167  av_unreachable("Invalid operation type!");
168  return false;
169 }
170 
171 /**
172  * Try to commute a filter op with the previous operation. Makes any
173  * adjustments to the operations as needed, but does not perform the actual
174  * commutation.
175  *
176  * Returns whether successful.
177  */
178 static bool op_commute_filter(SwsOp *op, SwsOp *prev)
179 {
180  switch (prev->op) {
181  case SWS_OP_SWIZZLE:
182  case SWS_OP_SCALE:
183  case SWS_OP_LINEAR:
184  case SWS_OP_DITHER:
185  prev->type = SWS_PIXEL_F32;
186  return true;
187  case SWS_OP_CONVERT:
188  if (prev->convert.to == SWS_PIXEL_F32) {
189  av_assert0(!prev->convert.expand);
190  FFSWAP(SwsPixelType, op->type, prev->type);
191  return true;
192  }
193  return false;
194  case SWS_OP_INVALID:
195  case SWS_OP_READ:
196  case SWS_OP_WRITE:
197  case SWS_OP_SWAP_BYTES:
198  case SWS_OP_UNPACK:
199  case SWS_OP_PACK:
200  case SWS_OP_LSHIFT:
201  case SWS_OP_RSHIFT:
202  case SWS_OP_CLEAR:
203  case SWS_OP_MIN:
204  case SWS_OP_MAX:
205  case SWS_OP_FILTER_H:
206  case SWS_OP_FILTER_V:
207  return false;
208  case SWS_OP_TYPE_NB:
209  break;
210  }
211 
212  av_unreachable("Invalid operation type!");
213  return false;
214 }
215 
216 /* returns log2(x) only if x is a power of two, or 0 otherwise */
217 static int exact_log2(const int x)
218 {
219  int p;
220  if (x <= 0)
221  return 0;
222  p = av_log2(x);
223  return (1 << p) == x ? p : 0;
224 }
225 
226 static int exact_log2_q(const AVRational x)
227 {
228  if (x.den == 1)
229  return exact_log2(x.num);
230  else if (x.num == 1)
231  return -exact_log2(x.den);
232  else
233  return 0;
234 }
235 
236 /**
237  * If a linear operation can be reduced to a scalar multiplication, returns
238  * the corresponding scaling factor, or 0 otherwise.
239  */
240 static bool extract_scalar(const SwsLinearOp *c, SwsComps comps, SwsComps prev,
241  SwsConst *out_scale)
242 {
243  SwsConst scale = {0};
244 
245  /* There are components not on the main diagonal */
246  if (c->mask & ~SWS_MASK_DIAG4)
247  return false;
248 
249  for (int i = 0; i < 4; i++) {
250  const AVRational s = c->m[i][i];
251  if ((prev.flags[i] & SWS_COMP_ZERO) ||
252  (comps.flags[i] & SWS_COMP_GARBAGE))
253  continue;
254  if (scale.q.den && av_cmp_q(s, scale.q))
255  return false;
256  scale.q = s;
257  }
258 
259  if (scale.q.den)
260  *out_scale = scale;
261  return scale.q.den;
262 }
263 
264 /* Extracts an integer clear operation (subset) from the given linear op. */
266  SwsConst *out_clear)
267 {
268  SwsConst clear = {0};
269  bool ret = false;
270 
271  for (int i = 0; i < 4; i++) {
272  bool const_row = c->m[i][4].den == 1; /* offset is integer */
273  for (int j = 0; j < 4; j++) {
274  const_row &= c->m[i][j].num == 0 || /* scalar is zero */
275  (prev.flags[j] & SWS_COMP_ZERO); /* input is zero */
276  }
277  if (const_row && (c->mask & SWS_MASK_ROW(i))) {
278  clear.q4[i] = c->m[i][4];
279  for (int j = 0; j < 5; j++)
280  c->m[i][j] = Q(i == j);
281  c->mask &= ~SWS_MASK_ROW(i);
282  ret = true;
283  }
284  }
285 
286  if (ret)
287  *out_clear = clear;
288  return ret;
289 }
290 
291 /* Unswizzle a linear operation by aligning single-input rows with
292  * their corresponding diagonal */
293 static bool extract_swizzle(SwsLinearOp *op, SwsComps prev, SwsSwizzleOp *out_swiz)
294 {
295  SwsSwizzleOp swiz = SWS_SWIZZLE(0, 1, 2, 3);
296  SwsLinearOp c = *op;
297 
298  /* Find non-zero coefficients in the main 4x4 matrix */
299  uint32_t nonzero = 0;
300  for (int i = 0; i < 4; i++) {
301  for (int j = 0; j < 4; j++) {
302  if (!c.m[i][j].num || (prev.flags[j] & SWS_COMP_ZERO))
303  continue;
304  nonzero |= SWS_MASK(i, j);
305  }
306  }
307 
308  /* If a value is unique in its row and the target column is
309  * empty, move it there and update the input swizzle */
310  for (int i = 0; i < 4; i++) {
311  if (nonzero & SWS_MASK_COL(i))
312  continue; /* target column is not empty */
313  for (int j = 0; j < 4; j++) {
314  if ((nonzero & SWS_MASK_ROW(i)) == SWS_MASK(i, j)) {
315  /* Move coefficient to the diagonal */
316  c.m[i][i] = c.m[i][j];
317  c.m[i][j] = Q(0);
318  swiz.in[i] = j;
319  break;
320  }
321  }
322  }
323 
324  if (swiz.mask == SWS_SWIZZLE(0, 1, 2, 3).mask)
325  return false; /* no swizzle was identified */
326 
327  c.mask = ff_sws_linear_mask(c);
328  *out_swiz = swiz;
329  *op = c;
330  return true;
331 }
332 
334 {
335  int ret;
336 
337 retry:
339 
340  /* Try to push filters towards the input; do this first to unblock
341  * in-place optimizations like linear op fusion */
342  for (int n = 1; n < ops->num_ops; n++) {
343  SwsOp *op = &ops->ops[n];
344  SwsOp *prev = &ops->ops[n - 1];
345 
346  switch (op->op) {
347  case SWS_OP_FILTER_H:
348  case SWS_OP_FILTER_V:
349  if (op_commute_filter(op, prev)) {
350  FFSWAP(SwsOp, *op, *prev);
351  goto retry;
352  }
353  break;
354  }
355  }
356 
357  /* Apply all in-place optimizations (that do not re-order the list) */
358  for (int n = 0; n < ops->num_ops; n++) {
359  SwsOp dummy = {0};
360  SwsOp *op = &ops->ops[n];
361  SwsOp *prev = n ? &ops->ops[n - 1] : &dummy;
362  SwsOp *next = n + 1 < ops->num_ops ? &ops->ops[n + 1] : &dummy;
363 
364  /* common helper variable */
365  bool noop = true;
366 
367  if (!SWS_OP_NEEDED(op, 0) && !SWS_OP_NEEDED(op, 1) &&
368  !SWS_OP_NEEDED(op, 2) && !SWS_OP_NEEDED(op, 3) &&
369  op->op != SWS_OP_WRITE)
370  {
371  /* Remove any operation whose output is not needed */
372  ff_sws_op_list_remove_at(ops, n, 1);
373  goto retry;
374  }
375 
376  switch (op->op) {
377  case SWS_OP_READ:
378  /* "Compress" planar reads where not all components are needed */
379  if (!op->rw.packed) {
380  SwsSwizzleOp swiz = SWS_SWIZZLE(0, 1, 2, 3);
381  int nb_planes = 0;
382  for (int i = 0; i < op->rw.elems; i++) {
383  if (!SWS_OP_NEEDED(op, i)) {
384  swiz.in[i] = 3 - (i - nb_planes); /* map to unused plane */
385  continue;
386  }
387 
388  const int idx = nb_planes++;
389  av_assert1(idx <= i);
390  ops->plane_src[idx] = ops->plane_src[i];
391  swiz.in[i] = idx;
392  }
393 
394  if (nb_planes < op->rw.elems) {
395  op->rw.elems = nb_planes;
396  RET(ff_sws_op_list_insert_at(ops, n + 1, &(SwsOp) {
397  .op = SWS_OP_SWIZZLE,
398  .type = op->rw.filter ? SWS_PIXEL_F32 : op->type,
399  .swizzle = swiz,
400  }));
401  goto retry;
402  }
403  }
404  break;
405 
406  case SWS_OP_SWAP_BYTES:
407  /* Redundant (double) swap */
408  if (next->op == SWS_OP_SWAP_BYTES) {
409  ff_sws_op_list_remove_at(ops, n, 2);
410  goto retry;
411  }
412  break;
413 
414  case SWS_OP_UNPACK:
415  /* Redundant unpack+pack */
416  if (next->op == SWS_OP_PACK && next->type == op->type &&
417  next->pack.pattern[0] == op->pack.pattern[0] &&
418  next->pack.pattern[1] == op->pack.pattern[1] &&
419  next->pack.pattern[2] == op->pack.pattern[2] &&
420  next->pack.pattern[3] == op->pack.pattern[3])
421  {
422  ff_sws_op_list_remove_at(ops, n, 2);
423  goto retry;
424  }
425  break;
426 
427  case SWS_OP_LSHIFT:
428  case SWS_OP_RSHIFT:
429  /* Two shifts in the same direction */
430  if (next->op == op->op) {
431  op->c.u += next->c.u;
432  ff_sws_op_list_remove_at(ops, n + 1, 1);
433  goto retry;
434  }
435 
436  /* No-op shift */
437  if (!op->c.u) {
438  ff_sws_op_list_remove_at(ops, n, 1);
439  goto retry;
440  }
441  break;
442 
443  case SWS_OP_CLEAR:
444  for (int i = 0; i < 4; i++) {
445  if (!op->c.q4[i].den)
446  continue;
447 
448  if ((prev->comps.flags[i] & SWS_COMP_ZERO) &&
449  !(prev->comps.flags[i] & SWS_COMP_GARBAGE) &&
450  op->c.q4[i].num == 0)
451  {
452  /* Redundant clear-to-zero of zero component */
453  op->c.q4[i].den = 0;
454  } else if (!SWS_OP_NEEDED(op, i)) {
455  /* Unnecessary clear of unused component */
456  op->c.q4[i] = (AVRational) {0, 0};
457  } else if (op->c.q4[i].den) {
458  noop = false;
459  }
460  }
461 
462  if (noop) {
463  ff_sws_op_list_remove_at(ops, n, 1);
464  goto retry;
465  }
466 
467  /* Transitive clear */
468  if (next->op == SWS_OP_CLEAR) {
469  for (int i = 0; i < 4; i++) {
470  if (next->c.q4[i].den)
471  op->c.q4[i] = next->c.q4[i];
472  }
473  ff_sws_op_list_remove_at(ops, n + 1, 1);
474  goto retry;
475  }
476  break;
477 
478  case SWS_OP_SWIZZLE:
479  for (int i = 0; i < 4; i++) {
480  if (!SWS_OP_NEEDED(op, i))
481  continue;
482  if (op->swizzle.in[i] != i)
483  noop = false;
484  }
485 
486  /* Identity swizzle */
487  if (noop) {
488  ff_sws_op_list_remove_at(ops, n, 1);
489  goto retry;
490  }
491 
492  /* Transitive swizzle */
493  if (next->op == SWS_OP_SWIZZLE) {
494  const SwsSwizzleOp orig = op->swizzle;
495  for (int i = 0; i < 4; i++)
496  op->swizzle.in[i] = orig.in[next->swizzle.in[i]];
497  ff_sws_op_list_remove_at(ops, n + 1, 1);
498  goto retry;
499  }
500 
501  /* Swizzle planes instead of components, if possible */
502  if (prev->op == SWS_OP_READ && !prev->rw.packed) {
503  for (int dst = 0; dst < prev->rw.elems; dst++) {
504  const int src = op->swizzle.in[dst];
505  if (src > dst && src < prev->rw.elems) {
506  FFSWAP(int, ops->plane_src[dst], ops->plane_src[src]);
507  for (int i = dst; i < 4; i++) {
508  if (op->swizzle.in[i] == dst)
509  op->swizzle.in[i] = src;
510  else if (op->swizzle.in[i] == src)
511  op->swizzle.in[i] = dst;
512  }
513  goto retry;
514  }
515  }
516  }
517 
518  if (next->op == SWS_OP_WRITE && !next->rw.packed) {
519  for (int dst = 0; dst < next->rw.elems; dst++) {
520  const int src = op->swizzle.in[dst];
521  if (src > dst && src < next->rw.elems) {
522  FFSWAP(int, ops->plane_dst[dst], ops->plane_dst[src]);
523  FFSWAP(int, op->swizzle.in[dst], op->swizzle.in[src]);
524  goto retry;
525  }
526  }
527  }
528  break;
529 
530  case SWS_OP_CONVERT:
531  /* No-op conversion */
532  if (op->type == op->convert.to) {
533  ff_sws_op_list_remove_at(ops, n, 1);
534  goto retry;
535  }
536 
537  /* Transitive conversion */
538  if (next->op == SWS_OP_CONVERT &&
539  op->convert.expand == next->convert.expand)
540  {
541  av_assert1(op->convert.to == next->type);
542  op->convert.to = next->convert.to;
543  ff_sws_op_list_remove_at(ops, n + 1, 1);
544  goto retry;
545  }
546 
547  /* Conversion followed by integer expansion */
548  if (next->op == SWS_OP_SCALE && !op->convert.expand &&
549  ff_sws_pixel_type_is_int(op->type) &&
550  ff_sws_pixel_type_is_int(op->convert.to) &&
551  !av_cmp_q(next->c.q, ff_sws_pixel_expand(op->type, op->convert.to)))
552  {
553  op->convert.expand = true;
554  ff_sws_op_list_remove_at(ops, n + 1, 1);
555  goto retry;
556  }
557  break;
558 
559  case SWS_OP_MIN:
560  for (int i = 0; i < 4; i++) {
561  if (!SWS_OP_NEEDED(op, i) || !op->c.q4[i].den)
562  continue;
563  if (av_cmp_q(op->c.q4[i], prev->comps.max[i]) < 0)
564  noop = false;
565  }
566 
567  if (noop) {
568  ff_sws_op_list_remove_at(ops, n, 1);
569  goto retry;
570  }
571  break;
572 
573  case SWS_OP_MAX:
574  for (int i = 0; i < 4; i++) {
575  if (!SWS_OP_NEEDED(op, i) || !op->c.q4[i].den)
576  continue;
577  if (av_cmp_q(prev->comps.min[i], op->c.q4[i]) < 0)
578  noop = false;
579  }
580 
581  if (noop) {
582  ff_sws_op_list_remove_at(ops, n, 1);
583  goto retry;
584  }
585  break;
586 
587  case SWS_OP_DITHER:
588  for (int i = 0; i < 4; i++) {
589  if (op->dither.y_offset[i] < 0)
590  continue;
591  if (!SWS_OP_NEEDED(op, i) || (prev->comps.flags[i] & SWS_COMP_EXACT)) {
592  op->dither.y_offset[i] = -1; /* unnecessary dither */
593  goto retry;
594  } else {
595  noop = false;
596  }
597  }
598 
599  if (noop) {
600  ff_sws_op_list_remove_at(ops, n, 1);
601  goto retry;
602  }
603  break;
604 
605  case SWS_OP_LINEAR: {
606  SwsSwizzleOp swizzle;
607  SwsConst c;
608 
609  /* No-op (identity) linear operation */
610  if (!op->lin.mask) {
611  ff_sws_op_list_remove_at(ops, n, 1);
612  goto retry;
613  }
614 
615  if (next->op == SWS_OP_LINEAR) {
616  /* 5x5 matrix multiplication after appending [ 0 0 0 0 1 ] */
617  const SwsLinearOp m1 = op->lin;
618  const SwsLinearOp m2 = next->lin;
619  for (int i = 0; i < 4; i++) {
620  for (int j = 0; j < 5; j++) {
621  AVRational sum = Q(0);
622  for (int k = 0; k < 4; k++)
623  sum = av_add_q(sum, av_mul_q(m2.m[i][k], m1.m[k][j]));
624  if (j == 4) /* m1.m[4][j] == 1 */
625  sum = av_add_q(sum, m2.m[i][4]);
626  op->lin.m[i][j] = sum;
627  }
628  }
629  op->lin.mask = ff_sws_linear_mask(op->lin);
630  ff_sws_op_list_remove_at(ops, n + 1, 1);
631  goto retry;
632  }
633 
634  /* Optimize away zero columns */
635  for (int j = 0; j < 4; j++) {
636  const uint32_t col = SWS_MASK_COL(j);
637  if (!(prev->comps.flags[j] & SWS_COMP_ZERO) || !(op->lin.mask & col))
638  continue;
639  for (int i = 0; i < 4; i++)
640  op->lin.m[i][j] = Q(i == j);
641  op->lin.mask &= ~col;
642  goto retry;
643  }
644 
645  /* Optimize away unused rows */
646  for (int i = 0; i < 4; i++) {
647  const uint32_t row = SWS_MASK_ROW(i);
648  if (SWS_OP_NEEDED(op, i) || !(op->lin.mask & row))
649  continue;
650  for (int j = 0; j < 5; j++)
651  op->lin.m[i][j] = Q(i == j);
652  op->lin.mask &= ~row;
653  goto retry;
654  }
655 
656  /* Convert constant rows to explicit clear instruction */
657  if (extract_constant_rows(&op->lin, prev->comps, &c)) {
658  RET(ff_sws_op_list_insert_at(ops, n + 1, &(SwsOp) {
659  .op = SWS_OP_CLEAR,
660  .type = op->type,
661  .comps = op->comps,
662  .c = c,
663  }));
664  goto retry;
665  }
666 
667  /* Multiplication by scalar constant */
668  if (extract_scalar(&op->lin, op->comps, prev->comps, &c)) {
669  op->op = SWS_OP_SCALE;
670  op->c = c;
671  goto retry;
672  }
673 
674  /* Swizzle by fixed pattern */
675  if (extract_swizzle(&op->lin, prev->comps, &swizzle)) {
676  RET(ff_sws_op_list_insert_at(ops, n, &(SwsOp) {
677  .op = SWS_OP_SWIZZLE,
678  .type = op->type,
679  .swizzle = swizzle,
680  }));
681  goto retry;
682  }
683  break;
684  }
685 
686  case SWS_OP_SCALE: {
687  const int factor2 = exact_log2_q(op->c.q);
688 
689  /* No-op scaling */
690  if (op->c.q.num == 1 && op->c.q.den == 1) {
691  ff_sws_op_list_remove_at(ops, n, 1);
692  goto retry;
693  }
694 
695  /* Merge consecutive scaling operations (that don't overflow) */
696  if (next->op == SWS_OP_SCALE) {
697  int64_t p = op->c.q.num * (int64_t) next->c.q.num;
698  int64_t q = op->c.q.den * (int64_t) next->c.q.den;
699  if (FFABS(p) <= INT_MAX && FFABS(q) <= INT_MAX) {
700  av_reduce(&op->c.q.num, &op->c.q.den, p, q, INT_MAX);
701  ff_sws_op_list_remove_at(ops, n + 1, 1);
702  goto retry;
703  }
704  }
705 
706  /* Scaling by exact power of two */
707  if (factor2 && ff_sws_pixel_type_is_int(op->type)) {
708  op->op = factor2 > 0 ? SWS_OP_LSHIFT : SWS_OP_RSHIFT;
709  op->c.u = FFABS(factor2);
710  goto retry;
711  }
712  break;
713  }
714 
715  case SWS_OP_FILTER_H:
716  case SWS_OP_FILTER_V:
717  /* Merge with prior simple planar read */
718  if (prev->op == SWS_OP_READ && !prev->rw.filter &&
719  !prev->rw.packed && !prev->rw.frac) {
720  prev->rw.filter = op->op;
721  prev->rw.kernel = av_refstruct_ref(op->filter.kernel);
722  ff_sws_op_list_remove_at(ops, n, 1);
723  goto retry;
724  }
725  break;
726  }
727  }
728 
729  /* Push clears to the back to void any unused components */
730  for (int n = 0; n < ops->num_ops - 1; n++) {
731  SwsOp *op = &ops->ops[n];
732  SwsOp *next = &ops->ops[n + 1];
733 
734  switch (op->op) {
735  case SWS_OP_CLEAR:
736  if (op_commute_clear(op, next)) {
737  FFSWAP(SwsOp, *op, *next);
738  goto retry;
739  }
740  break;
741  }
742  }
743 
744  /* Apply any remaining preferential re-ordering optimizations; do these
745  * last because they are more likely to block other optimizations if done
746  * too aggressively */
747  for (int n = 0; n < ops->num_ops - 1; n++) {
748  SwsOp *op = &ops->ops[n];
749  SwsOp *next = &ops->ops[n + 1];
750 
751  switch (op->op) {
752  case SWS_OP_SWIZZLE: {
753  /* Try to push swizzles towards the output */
754  if (op_commute_swizzle(op, next)) {
755  FFSWAP(SwsOp, *op, *next);
756  goto retry;
757  }
758  break;
759  }
760 
761  case SWS_OP_SCALE:
762  /* Scaling by integer before conversion to int */
763  if (op->c.q.den == 1 && next->op == SWS_OP_CONVERT &&
765  {
766  op->type = next->convert.to;
767  FFSWAP(SwsOp, *op, *next);
768  goto retry;
769  }
770  break;
771  }
772  }
773 
774  return 0;
775 }
776 
777 int ff_sws_solve_shuffle(const SwsOpList *const ops, uint8_t shuffle[],
778  int size, uint8_t clear_val,
779  int *read_bytes, int *write_bytes)
780 {
781  if (!ops->num_ops)
782  return AVERROR(EINVAL);
783 
784  const SwsOp *read = ff_sws_op_list_input(ops);
785  if (!read || read->rw.frac || read->rw.filter ||
786  (!read->rw.packed && read->rw.elems > 1))
787  return AVERROR(ENOTSUP);
788 
789  const int read_size = ff_sws_pixel_type_size(read->type);
790  uint32_t mask[4] = {0};
791  for (int i = 0; i < read->rw.elems; i++)
792  mask[i] = 0x01010101 * i * read_size + 0x03020100;
793 
794  for (int opidx = 1; opidx < ops->num_ops; opidx++) {
795  const SwsOp *op = &ops->ops[opidx];
796  switch (op->op) {
797  case SWS_OP_SWIZZLE: {
798  uint32_t orig[4] = { mask[0], mask[1], mask[2], mask[3] };
799  for (int i = 0; i < 4; i++)
800  mask[i] = orig[op->swizzle.in[i]];
801  break;
802  }
803 
804  case SWS_OP_SWAP_BYTES:
805  for (int i = 0; i < 4; i++) {
806  switch (ff_sws_pixel_type_size(op->type)) {
807  case 2: mask[i] = av_bswap16(mask[i]); break;
808  case 4: mask[i] = av_bswap32(mask[i]); break;
809  }
810  }
811  break;
812 
813  case SWS_OP_CLEAR:
814  for (int i = 0; i < 4; i++) {
815  if (!op->c.q4[i].den)
816  continue;
817  if (op->c.q4[i].num != 0 || !clear_val)
818  return AVERROR(ENOTSUP);
819  mask[i] = 0x1010101ul * clear_val;
820  }
821  break;
822 
823  case SWS_OP_CONVERT: {
824  if (!op->convert.expand)
825  return AVERROR(ENOTSUP);
826  for (int i = 0; i < 4; i++) {
827  switch (ff_sws_pixel_type_size(op->type)) {
828  case 1: mask[i] = 0x01010101 * (mask[i] & 0xFF); break;
829  case 2: mask[i] = 0x00010001 * (mask[i] & 0xFFFF); break;
830  }
831  }
832  break;
833  }
834 
835  case SWS_OP_WRITE: {
836  if (op->rw.frac || op->rw.filter ||
837  (!op->rw.packed && op->rw.elems > 1))
838  return AVERROR(ENOTSUP);
839 
840  /* Initialize to no-op */
841  memset(shuffle, clear_val, size);
842 
843  const int write_size = ff_sws_pixel_type_size(op->type);
844  const int read_chunk = read->rw.elems * read_size;
845  const int write_chunk = op->rw.elems * write_size;
846  const int num_groups = size / FFMAX(read_chunk, write_chunk);
847  for (int n = 0; n < num_groups; n++) {
848  const int base_in = n * read_chunk;
849  const int base_out = n * write_chunk;
850  for (int i = 0; i < op->rw.elems; i++) {
851  const int offset = base_out + i * write_size;
852  for (int b = 0; b < write_size; b++) {
853  const uint8_t idx = mask[i] >> (b * 8);
854  if (idx != clear_val)
855  shuffle[offset + b] = base_in + idx;
856  }
857  }
858  }
859 
860  *read_bytes = num_groups * read_chunk;
861  *write_bytes = num_groups * write_chunk;
862  return num_groups;
863  }
864 
865  default:
866  return AVERROR(ENOTSUP);
867  }
868  }
869 
870  return AVERROR(EINVAL);
871 }
872 
873 /**
874  * Determine a suitable intermediate buffer format for a given combination
875  * of pixel types and number of planes. The exact interpretation of these
876  * formats does not matter at all; since they will only ever be used as
877  * temporary intermediate buffers. We still need to pick *some* format as
878  * a consequence of ff_sws_graph_add_pass() taking an AVPixelFormat for the
879  * output buffer.
880  */
881 static enum AVPixelFormat get_planar_fmt(SwsPixelType type, int nb_planes)
882 {
883  switch (ff_sws_pixel_type_size(type)) {
884  case 1:
885  switch (nb_planes) {
886  case 1: return AV_PIX_FMT_GRAY8;
887  case 2: return AV_PIX_FMT_YUV444P; // FIXME: no 2-plane planar fmt
888  case 3: return AV_PIX_FMT_YUV444P;
889  case 4: return AV_PIX_FMT_YUVA444P;
890  }
891  break;
892  case 2:
893  switch (nb_planes) {
894  case 1: return AV_PIX_FMT_GRAY16;
895  case 2: return AV_PIX_FMT_YUV444P16; // FIXME: no 2-plane planar fmt
896  case 3: return AV_PIX_FMT_YUV444P16;
897  case 4: return AV_PIX_FMT_YUVA444P16;
898  }
899  break;
900  case 4:
901  switch (nb_planes) {
902  case 1: return AV_PIX_FMT_GRAYF32;
903  case 2: return AV_PIX_FMT_GBRPF32; // FIXME: no 2-plane planar fmt
904  case 3: return AV_PIX_FMT_GBRPF32;
905  case 4: return AV_PIX_FMT_GBRAPF32;
906  }
907  break;
908  }
909 
910  av_unreachable("Invalid pixel type or number of planes?");
911  return AV_PIX_FMT_NONE;
912 }
913 
914 static void get_input_size(const SwsOpList *ops, SwsFormat *fmt)
915 {
916  fmt->width = ops->src.width;
917  fmt->height = ops->src.height;
918 
919  const SwsOp *read = ff_sws_op_list_input(ops);
920  if (read && read->rw.filter == SWS_OP_FILTER_V) {
921  fmt->height = read->rw.kernel->dst_size;
922  } else if (read && read->rw.filter == SWS_OP_FILTER_H) {
923  fmt->width = read->rw.kernel->dst_size;
924  }
925 }
926 
928 {
929  const SwsOp *op;
930  int ret, idx;
931 
932  for (idx = 0; idx < ops1->num_ops; idx++) {
933  op = &ops1->ops[idx];
934  if (op->op == SWS_OP_FILTER_H || op->op == SWS_OP_FILTER_V)
935  break;
936  }
937 
938  if (idx == ops1->num_ops) {
939  *out_rest = NULL;
940  return 0;
941  }
942 
943  av_assert0(idx > 0);
944  const SwsOp *prev = &ops1->ops[idx - 1];
945 
946  SwsOpList *ops2 = ff_sws_op_list_duplicate(ops1);
947  if (!ops2)
948  return AVERROR(ENOMEM);
949 
950  /**
951  * Not all components may be needed; but we need the ones that *are*
952  * used to be contiguous for the write/read operations. So, first
953  * compress them into a linearly ascending list of components
954  */
955  int nb_planes = 0;
956  SwsSwizzleOp swiz_wr = SWS_SWIZZLE(0, 1, 2, 3);
957  SwsSwizzleOp swiz_rd = SWS_SWIZZLE(0, 1, 2, 3);
958  for (int i = 0; i < 4; i++) {
959  if (SWS_OP_NEEDED(prev, i)) {
960  const int o = nb_planes++;
961  swiz_wr.in[o] = i;
962  swiz_rd.in[i] = o;
963  }
964  }
965 
966  /* Determine metadata for the intermediate format */
967  const SwsPixelType type = op->type;
968  ops2->comps_src = prev->comps;
969  ops2->src.format = get_planar_fmt(type, nb_planes);
970  ops2->src.desc = av_pix_fmt_desc_get(ops2->src.format);
971  get_input_size(ops1, &ops2->src);
972  ops1->dst = ops2->src;
973 
974  for (int i = 0; i < nb_planes; i++)
975  ops1->plane_dst[i] = ops2->plane_src[i] = i;
976 
977  ff_sws_op_list_remove_at(ops1, idx, ops1->num_ops - idx);
978  ff_sws_op_list_remove_at(ops2, 0, idx);
979  op = NULL; /* the above command may invalidate op */
980 
981  if (swiz_wr.mask != SWS_SWIZZLE(0, 1, 2, 3).mask) {
982  ret = ff_sws_op_list_append(ops1, &(SwsOp) {
983  .op = SWS_OP_SWIZZLE,
984  .type = type,
985  .swizzle = swiz_wr,
986  });
987  if (ret < 0)
988  goto fail;
989  }
990 
991  ret = ff_sws_op_list_append(ops1, &(SwsOp) {
992  .op = SWS_OP_WRITE,
993  .type = type,
994  .rw.elems = nb_planes,
995  });
996  if (ret < 0)
997  goto fail;
998 
999  ret = ff_sws_op_list_insert_at(ops2, 0, &(SwsOp) {
1000  .op = SWS_OP_READ,
1001  .type = type,
1002  .rw.elems = nb_planes,
1003  });
1004  if (ret < 0)
1005  goto fail;
1006 
1007  if (swiz_rd.mask != SWS_SWIZZLE(0, 1, 2, 3).mask) {
1008  ret = ff_sws_op_list_insert_at(ops2, 1, &(SwsOp) {
1009  .op = SWS_OP_SWIZZLE,
1010  .type = type,
1011  .swizzle = swiz_rd,
1012  });
1013  if (ret < 0)
1014  goto fail;
1015  }
1016 
1017  ret = ff_sws_op_list_optimize(ops1);
1018  if (ret < 0)
1019  goto fail;
1020 
1021  ret = ff_sws_op_list_optimize(ops2);
1022  if (ret < 0)
1023  goto fail;
1024 
1025  *out_rest = ops2;
1026  return 0;
1027 
1028 fail:
1029  ff_sws_op_list_free(&ops2);
1030  return ret;
1031 }
SWS_OP_READ
@ SWS_OP_READ
Definition: ops.h:50
SWS_PIXEL_U16
@ SWS_PIXEL_U16
Definition: ops.h:36
ff_sws_op_list_free
void ff_sws_op_list_free(SwsOpList **p_ops)
Definition: ops.c:580
AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:71
SWS_OP_SWIZZLE
@ SWS_OP_SWIZZLE
Definition: ops.h:53
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
SWS_OP_LSHIFT
@ SWS_OP_LSHIFT
Definition: ops.h:58
SWS_OP_UNPACK
@ SWS_OP_UNPACK
Definition: ops.h:56
ff_sws_op_list_duplicate
SwsOpList * ff_sws_op_list_duplicate(const SwsOpList *ops)
Returns a duplicate of ops, or NULL on OOM.
Definition: ops.c:594
SwsSwizzleOp::mask
uint32_t mask
Definition: ops.h:147
SwsOpList::comps_src
SwsComps comps_src
Source component metadata associated with pixel values from each corresponding component (in plane/me...
Definition: ops.h:273
ff_sws_op_list_input
const SwsOp * ff_sws_op_list_input(const SwsOpList *ops)
Returns the input operation for a given op list, or NULL if there is none (e.g.
Definition: ops.c:631
av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:3456
SwsConst
Definition: ops.h:90
SWS_COMP_ZERO
@ SWS_COMP_ZERO
Definition: ops.h:84
SWS_OP_CLEAR
@ SWS_OP_CLEAR
Definition: ops.h:62
ff_sws_linear_mask
uint32_t ff_sws_linear_mask(const SwsLinearOp c)
Definition: ops.c:719
SwsOp::swizzle
SwsSwizzleOp swizzle
Definition: ops.h:219
SwsLinearOp::m
AVRational m[4][5]
Generalized 5x5 affine transformation: [ Out.x ] = [ A B C D E ] [ Out.y ] = [ F G H I J ] * [ x y z ...
Definition: ops.h:180
SwsOp::convert
SwsConvertOp convert
Definition: ops.h:220
rational.h
int64_t
long long int64_t
Definition: coverity.c:34
ff_sws_op_list_append
int ff_sws_op_list_append(SwsOpList *ops, SwsOp *op)
These will take over ownership of op and set it to {0}, even on failure.
Definition: ops.c:674
mask
int mask
Definition: mediacodecdec_common.c:154
SwsOp::rw
SwsReadWriteOp rw
Definition: ops.h:217
ops.h
SWS_OP_DITHER
@ SWS_OP_DITHER
Definition: ops.h:70
read_bytes
static void read_bytes(const uint8_t *src, float *dst, int src_stride, int dst_stride, int width, int height, float scale)
Definition: vf_nnedi.c:442
b
#define b
Definition: input.c:42
get_input_size
static void get_input_size(const SwsOpList *ops, SwsFormat *fmt)
Definition: ops_optimizer.c:914
ff_sws_op_list_optimize
int ff_sws_op_list_optimize(SwsOpList *ops)
Fuse compatible and eliminate redundant operations, as well as replacing some operations with more ef...
Definition: ops_optimizer.c:333
SWS_PIXEL_U32
@ SWS_PIXEL_U32
Definition: ops.h:37
SWS_OP_TYPE_NB
@ SWS_OP_TYPE_NB
Definition: ops.h:76
FFMAX
#define FFMAX(a, b)
Definition: macros.h:47
ff_sws_pixel_type_size
int ff_sws_pixel_type_size(SwsPixelType type)
Definition: ops.c:68
dummy
static int dummy
Definition: ffplay.c:3751
SWS_MASK_ROW
#define SWS_MASK_ROW(I)
Definition: ops.h:186
SwsPixelType
SwsPixelType
Copyright (C) 2025 Niklas Haas.
Definition: ops.h:33
SwsComps::max
AVRational max[4]
Definition: ops.h:106
SwsOpList::plane_dst
uint8_t plane_dst[4]
Definition: ops.h:262
SWS_PIXEL_F32
@ SWS_PIXEL_F32
Definition: ops.h:38
fail
#define fail()
Definition: checkasm.h:223
SwsOpList::num_ops
int num_ops
Definition: ops.h:256
SWS_MASK_COL
#define SWS_MASK_COL(J)
Definition: ops.h:187
SwsDitherOp
Definition: ops.h:160
AV_PIX_FMT_YUVA444P16
#define AV_PIX_FMT_YUVA444P16
Definition: pixfmt.h:597
SwsOp::c
SwsConst c
Definition: ops.h:223
SwsSwizzleOp
Definition: ops.h:141
ff_sws_pixel_type_is_int
bool ff_sws_pixel_type_is_int(SwsPixelType type)
Definition: ops.c:83
type
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf type
Definition: writing_filters.txt:86
AV_PIX_FMT_GRAY16
#define AV_PIX_FMT_GRAY16
Definition: pixfmt.h:522
av_reduce
int av_reduce(int *dst_num, int *dst_den, int64_t num, int64_t den, int64_t max)
Reduce a fraction.
Definition: rational.c:35
AVRational::num
int num
Numerator.
Definition: rational.h:59
SwsOp::op
SwsOpType op
Definition: ops.h:213
Q
#define Q(q)
SWS_OP_SCALE
@ SWS_OP_SCALE
Definition: ops.h:66
avassert.h
SwsFormat::height
int height
Definition: format.h:78
SWS_OP_NEEDED
#define SWS_OP_NEEDED(op, idx)
Definition: ops.h:88
s
#define s(width, name)
Definition: cbs_vp9.c:198
AV_PIX_FMT_YUV444P16
#define AV_PIX_FMT_YUV444P16
Definition: pixfmt.h:552
SWS_SWIZZLE
#define SWS_SWIZZLE(X, Y, Z, W)
Definition: ops.h:153
SwsComps::min
AVRational min[4]
Definition: ops.h:106
read_chunk
static int read_chunk(AVFormatContext *s)
Definition: dhav.c:173
op
static int op(uint8_t **dst, const uint8_t *dst_end, GetByteContext *gb, int pixel, int count, int *x, int width, int linesize)
Perform decode operation.
Definition: anm.c:76
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:42
SWS_OP_MIN
@ SWS_OP_MIN
Definition: ops.h:64
exact_log2_q
static int exact_log2_q(const AVRational x)
Definition: ops_optimizer.c:226
ff_sws_pixel_expand
static AVRational ff_sws_pixel_expand(SwsPixelType from, SwsPixelType to)
Definition: ops_internal.h:31
SWS_OP_LINEAR
@ SWS_OP_LINEAR
Definition: ops.h:69
op_commute_filter
static bool op_commute_filter(SwsOp *op, SwsOp *prev)
Try to commute a filter op with the previous operation.
Definition: ops_optimizer.c:178
SWS_OP_FILTER_H
@ SWS_OP_FILTER_H
Definition: ops.h:73
AV_PIX_FMT_GRAYF32
#define AV_PIX_FMT_GRAYF32
Definition: pixfmt.h:582
tmp
static uint8_t tmp[40]
Definition: aes_ctr.c:52
FFABS
#define FFABS(a)
Absolute value, Note, INT_MIN / INT64_MIN result in undefined behavior as they are not representable ...
Definition: common.h:74
SWS_OP_PACK
@ SWS_OP_PACK
Definition: ops.h:57
SwsOp::dither
SwsDitherOp dither
Definition: ops.h:221
SwsReadWriteOp::kernel
SwsFilterWeights * kernel
Definition: ops.h:130
NULL
#define NULL
Definition: coverity.c:32
extract_scalar
static bool extract_scalar(const SwsLinearOp *c, SwsComps comps, SwsComps prev, SwsConst *out_scale)
If a linear operation can be reduced to a scalar multiplication, returns the corresponding scaling fa...
Definition: ops_optimizer.c:240
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
av_unreachable
#define av_unreachable(msg)
Asserts that are used as compiler optimization hints depending upon ASSERT_LEVEL and NBDEBUG.
Definition: avassert.h:116
SwsReadWriteOp::frac
uint8_t frac
Definition: ops.h:119
SWS_COMP_GARBAGE
@ SWS_COMP_GARBAGE
Definition: ops.h:82
SwsConvertOp::to
SwsPixelType to
Definition: ops.h:156
ff_sws_op_list_subpass
int ff_sws_op_list_subpass(SwsOpList *ops1, SwsOpList **out_rest)
Eliminate SWS_OP_FILTER_* operations by merging them with prior SWS_OP_READ operations.
Definition: ops_optimizer.c:927
SWS_OP_FILTER_V
@ SWS_OP_FILTER_V
Definition: ops.h:74
ff_sws_op_list_remove_at
void ff_sws_op_list_remove_at(SwsOpList *ops, int index, int count)
Definition: ops.c:649
RET
#define RET(x)
Copyright (C) 2025 Niklas Haas.
Definition: ops_optimizer.c:28
AV_PIX_FMT_GRAY8
@ AV_PIX_FMT_GRAY8
Y , 8bpp.
Definition: pixfmt.h:81
SWS_MASK
#define SWS_MASK(I, J)
Definition: ops.h:184
c
Undefined Behavior In the C some operations are like signed integer dereferencing freed accessing outside allocated Undefined Behavior must not occur in a C it is not safe even if the output of undefined operations is unused The unsafety may seem nit picking but Optimizing compilers have in fact optimized code on the assumption that no undefined Behavior occurs Optimizing code based on wrong assumptions can and has in some cases lead to effects beyond the output of computations The signed integer overflow problem in speed critical code Code which is highly optimized and works with signed integers sometimes has the problem that often the output of the computation does not c
Definition: undefined.txt:32
ff_sws_apply_op_q
void ff_sws_apply_op_q(const SwsOp *op, AVRational x[4])
Apply an operation to an AVRational.
Definition: ops.c:139
SwsConvertOp::expand
bool expand
Definition: ops.h:157
SwsPackOp::pattern
uint8_t pattern[4]
Packed bits are assumed to be LSB-aligned within the underlying integer type; i.e.
Definition: ops.h:138
SwsConst::q
AVRational q
Definition: ops.h:93
extract_constant_rows
static bool extract_constant_rows(SwsLinearOp *c, SwsComps prev, SwsConst *out_clear)
Definition: ops_optimizer.c:265
dst
uint8_t ptrdiff_t const uint8_t ptrdiff_t int intptr_t intptr_t int int16_t * dst
Definition: dsp.h:87
av_bswap32
#define av_bswap32
Definition: bswap.h:47
i
#define i(width, name, range_min, range_max)
Definition: cbs_h264.c:63
SwsOp::type
SwsPixelType type
Definition: ops.h:214
AV_PIX_FMT_GBRPF32
#define AV_PIX_FMT_GBRPF32
Definition: pixfmt.h:578
ff_sws_op_list_insert_at
int ff_sws_op_list_insert_at(SwsOpList *ops, int index, SwsOp *op)
Definition: ops.c:660
SWS_MASK_DIAG4
@ SWS_MASK_DIAG4
Definition: ops.h:200
size
int size
Definition: twinvq_data.h:10344
SWS_OP_RSHIFT
@ SWS_OP_RSHIFT
Definition: ops.h:59
SwsOp::lin
SwsLinearOp lin
Definition: ops.h:216
SwsOpList::src
SwsFormat src
Definition: ops.h:259
SWS_OP_INVALID
@ SWS_OP_INVALID
Definition: ops.h:47
ff_sws_op_list_update_comps
void ff_sws_op_list_update_comps(SwsOpList *ops)
Infer + propagate known information about components.
Definition: ops.c:297
SwsFormat
Definition: format.h:77
SWS_OP_WRITE
@ SWS_OP_WRITE
Definition: ops.h:51
av_refstruct_ref
void * av_refstruct_ref(void *obj)
Create a new reference to an object managed via this API, i.e.
Definition: refstruct.c:140
AV_PIX_FMT_YUVA444P
@ AV_PIX_FMT_YUVA444P
planar YUV 4:4:4 32bpp, (1 Cr & Cb sample per 1x1 Y & A samples)
Definition: pixfmt.h:174
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
SwsOp::comps
SwsComps comps
Metadata about the operation's input/output components.
Definition: ops.h:233
SwsLinearOp
Definition: ops.h:167
get_planar_fmt
static enum AVPixelFormat get_planar_fmt(SwsPixelType type, int nb_planes)
Determine a suitable intermediate buffer format for a given combination of pixel types and number of ...
Definition: ops_optimizer.c:881
noop
#define noop(a)
Definition: h264chroma_template.c:71
SwsFormat::format
enum AVPixelFormat format
Definition: format.h:80
extract_swizzle
static bool extract_swizzle(SwsLinearOp *op, SwsComps prev, SwsSwizzleOp *out_swiz)
Definition: ops_optimizer.c:293
SwsOpList::ops
SwsOp * ops
Definition: ops.h:255
SwsFormat::desc
const AVPixFmtDescriptor * desc
Definition: format.h:85
av_assert1
#define av_assert1(cond)
assert() equivalent, that does not lie in speed critical code.
Definition: avassert.h:58
SwsConst::q4
AVRational q4[4]
Definition: ops.h:92
ops_internal.h
SwsFormat::width
int width
Definition: format.h:78
SwsOp
Definition: ops.h:212
write_bytes
static void write_bytes(const float *src, uint8_t *dst, int src_stride, int dst_stride, int width, int height, int depth, float scale)
Definition: vf_nnedi.c:484
av_cmp_q
static int av_cmp_q(AVRational a, AVRational b)
Compare two rationals.
Definition: rational.h:89
SwsComps::flags
SwsCompFlags flags[4]
Definition: ops.h:101
ret
ret
Definition: filter_design.txt:187
bswap.h
FFSWAP
#define FFSWAP(type, a, b)
Definition: macros.h:52
SwsOpList::dst
SwsFormat dst
Definition: ops.h:259
SWS_OP_MAX
@ SWS_OP_MAX
Definition: ops.h:65
op_commute_swizzle
static bool op_commute_swizzle(SwsOp *op, SwsOp *next)
Try to commute a swizzle op with the next operation.
Definition: ops_optimizer.c:99
SwsReadWriteOp::filter
SwsOpType filter
Filter kernel to apply to each plane while sampling.
Definition: ops.h:129
SwsComps
Definition: ops.h:100
SwsConst::u
unsigned u
Definition: ops.h:94
AVRational::den
int den
Denominator.
Definition: rational.h:60
SwsReadWriteOp::packed
bool packed
Definition: ops.h:120
AV_PIX_FMT_NONE
@ AV_PIX_FMT_NONE
Definition: pixfmt.h:72
AV_PIX_FMT_GBRAPF32
#define AV_PIX_FMT_GBRAPF32
Definition: pixfmt.h:579
SWS_OP_SWAP_BYTES
@ SWS_OP_SWAP_BYTES
Definition: ops.h:52
ff_sws_solve_shuffle
int ff_sws_solve_shuffle(const SwsOpList *const ops, uint8_t shuffle[], int size, uint8_t clear_val, int *read_bytes, int *write_bytes)
"Solve" an op list into a fixed shuffle mask, with an optional ability to also directly clear the out...
Definition: ops_optimizer.c:777
Windows::Graphics::DirectX::Direct3D11::p
IDirect3DDxgiInterfaceAccess _COM_Outptr_ void ** p
Definition: vsrc_gfxcapture_winrt.hpp:53
av_mul_q
AVRational av_mul_q(AVRational b, AVRational c)
Multiply two rationals.
Definition: rational.c:80
AV_PIX_FMT_YUV444P
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:78
SWS_COMP_EXACT
@ SWS_COMP_EXACT
Definition: ops.h:83
SwsReadWriteOp::elems
uint8_t elems
Examples: rgba = 4x u8 packed yuv444p = 3x u8 rgb565 = 1x u16 <- use SWS_OP_UNPACK to unpack monow = ...
Definition: ops.h:118
SwsDitherOp::y_offset
int8_t y_offset[4]
Definition: ops.h:164
scale
static void scale(int *out, const int *in, const int w, const int h, const int shift)
Definition: intra.c:278
av_add_q
AVRational av_add_q(AVRational b, AVRational c)
Add two rationals.
Definition: rational.c:93
SwsSwizzleOp::in
uint8_t in[4]
Definition: ops.h:148
SWS_OP_CONVERT
@ SWS_OP_CONVERT
Definition: ops.h:63
op_commute_clear
static bool op_commute_clear(SwsOp *op, SwsOp *next)
Try to commute a clear op with the next operation.
Definition: ops_optimizer.c:40
SwsOpList::plane_src
uint8_t plane_src[4]
Definition: ops.h:262
SwsOpList
Helper struct for representing a list of operations.
Definition: ops.h:254
av_bswap16
#define av_bswap16
Definition: bswap.h:28
SwsOp::pack
SwsPackOp pack
Definition: ops.h:218
shuffle
static uint64_t shuffle(uint64_t in, const uint8_t *shuffle, int shuffle_len)
Definition: des.c:179
av_log2
int av_log2(unsigned v)
Definition: intmath.c:26
src
#define src
Definition: vp8dsp.c:248
read
static uint32_t BS_FUNC() read(BSCTX *bc, unsigned int n)
Return n bits from the buffer, n has to be in the 0-32 range.
Definition: bitstream_template.h:239
exact_log2
static int exact_log2(const int x)
Definition: ops_optimizer.c:217