28 #define randomize_buffer(buf, size) do { \
30 for (i = 0; i < size / 4; i++) \
31 ((uint32_t *)buf)[i] = rnd(); \
49 const int ii_w =
w + e*2;
50 const int ii_h =
h + e*2;
51 const int ii_lz_32 =
FFALIGN(ii_w + 1, 4);
52 uint32_t *ii_orig_ref =
av_calloc(ii_h + 1, ii_lz_32 *
sizeof(*ii_orig_ref));
53 uint32_t *ii_ref = ii_orig_ref + ii_lz_32 + 1;
54 uint32_t *ii_orig_new =
av_calloc(ii_h + 1, ii_lz_32 *
sizeof(*ii_orig_new));
55 uint32_t *ii_new = ii_orig_new + ii_lz_32 + 1;
60 const uint8_t *s1, ptrdiff_t linesize1,
61 const uint8_t *s2, ptrdiff_t linesize2,
66 for (offy = -
r; offy <=
r; offy++) {
67 for (offx = -
r; offx <=
r; offx++) {
71 const int s2x = e + offx;
72 const int s2y = e + offy;
73 const int startx_safe =
FFMAX(s1x, s2x);
74 const int starty_safe =
FFMAX(s1y, s2y);
75 const int u_endx_safe =
FFMIN(s1x +
w, s2x +
w);
76 const int endy_safe =
FFMIN(s1y +
h, s2y +
h);
77 const int safe_pw = (u_endx_safe - startx_safe) & ~0
xf;
78 const int safe_ph = endy_safe - starty_safe;
86 memset(ii_ref, 0, (ii_lz_32 * ii_h - 1) *
sizeof(*ii_ref));
87 memset(ii_new, 0, (ii_lz_32 * ii_h - 1) *
sizeof(*ii_new));
89 call_ref(ii_ref + starty_safe*ii_lz_32 + startx_safe, ii_lz_32,
90 src + (starty_safe - s1y) * src_lz + (startx_safe - s1x), src_lz,
91 src + (starty_safe - s2y) * src_lz + (startx_safe - s2x), src_lz,
93 call_new(ii_new + starty_safe*ii_lz_32 + startx_safe, ii_lz_32,
94 src + (starty_safe - s1y) * src_lz + (startx_safe - s1x), src_lz,
95 src + (starty_safe - s2y) * src_lz + (startx_safe - s2x), src_lz,
98 if (memcmp(ii_ref, ii_new, (ii_lz_32 * ii_h - 1) *
sizeof(*ii_ref)))
101 memset(ii_new, 0, (ii_lz_32 * ii_h - 1) *
sizeof(*ii_new));
102 bench_new(ii_new + starty_safe*ii_lz_32 + startx_safe, ii_lz_32,
103 src + (starty_safe - s1y) * src_lz + (startx_safe - s1x), src_lz,
104 src + (starty_safe - s2y) * src_lz + (startx_safe - s2x), src_lz,
117 #define MAX_MEANINGFUL_DIFF 255
119 const int endx = 200;
134 const uint32_t *
const iib,
135 const uint32_t *
const iid,
136 const uint32_t *
const iie,
137 const uint8_t *
const src,
140 const float *
const weight_lut,
141 ptrdiff_t max_meaningful_diff,
164 iie[
i] = iia[
i] + (iib[
i] - iia[
i]) + (iid[
i] - iia[
i]) +
diff;
168 memset(tw_ref, 0, (
TEST_W + 16) *
sizeof(
float));
169 memset(tw_new, 0, (
TEST_W + 16) *
sizeof(
float));
170 memset(sum_ref, 0, (
TEST_W + 16) *
sizeof(
float));
171 memset(sum_new, 0, (
TEST_W + 16) *
sizeof(
float));
173 call_ref(iia, iib, iid, iie,
src, tw_ref, sum_ref, lut,
175 call_new(iia, iib, iid, iie,
src, tw_new, sum_new, lut,
185 memset(tw_new, 0, (
TEST_W + 16) *
sizeof(
float));
186 memset(sum_new, 0, (
TEST_W + 16) *
sizeof(
float));
187 bench_new(iia, iib, iid, iie,
src, tw_new, sum_new, lut,