blob: 3827b65faea594f0d10071700d19853c0f0dae6d [file] [log] [blame]
Sarah Parker4dc0f1b2016-08-09 17:40:53 -07001/*
Yaowu Xubde4ac82016-11-28 15:26:06 -08002 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
Sarah Parker4dc0f1b2016-08-09 17:40:53 -07003 *
Yaowu Xubde4ac82016-11-28 15:26:06 -08004 * This source code is subject to the terms of the BSD 2 Clause License and
5 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6 * was not distributed with this source code in the LICENSE file, you can
7 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8 * Media Patent License 1.0 was not distributed with this source code in the
9 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070010 */
11
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070012#include <stdlib.h>
13#include <memory.h>
14#include <math.h>
15
David Barkeree674322017-05-10 15:43:02 +010016#include "./av1_rtcd.h"
Yaowu Xuf883b422016-08-30 14:01:10 -070017#include "av1/encoder/corner_match.h"
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070018
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070019#define SEARCH_SZ 9
20#define SEARCH_SZ_BY2 ((SEARCH_SZ - 1) / 2)
21
Yue Chen19e7aa82016-11-30 14:05:39 -080022#define THRESHOLD_NCC 0.75
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070023
David Barker15338d52017-02-13 15:30:59 +000024/* Compute var(im) * MATCH_SZ_SQ over a MATCH_SZ by MATCH_SZ window of im,
25 centered at (x, y).
26*/
27static double compute_variance(unsigned char *im, int stride, int x, int y) {
Yaowu Xufc4585b2017-05-05 11:18:22 -070028 int sum = 0;
29 int sumsq = 0;
David Barker15338d52017-02-13 15:30:59 +000030 int var;
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070031 int i, j;
32 for (i = 0; i < MATCH_SZ; ++i)
33 for (j = 0; j < MATCH_SZ; ++j) {
34 sum += im[(i + y - MATCH_SZ_BY2) * stride + (j + x - MATCH_SZ_BY2)];
35 sumsq += im[(i + y - MATCH_SZ_BY2) * stride + (j + x - MATCH_SZ_BY2)] *
36 im[(i + y - MATCH_SZ_BY2) * stride + (j + x - MATCH_SZ_BY2)];
37 }
David Barker15338d52017-02-13 15:30:59 +000038 var = sumsq * MATCH_SZ_SQ - sum * sum;
39 return (double)var;
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070040}
41
David Barker15338d52017-02-13 15:30:59 +000042/* Compute corr(im1, im2) * MATCH_SZ * stddev(im1), where the
43 correlation/standard deviation are taken over MATCH_SZ by MATCH_SZ windows
44 of each image, centered at (x1, y1) and (x2, y2) respectively.
45*/
David Barkeree674322017-05-10 15:43:02 +010046double compute_cross_correlation_c(unsigned char *im1, int stride1, int x1,
47 int y1, unsigned char *im2, int stride2,
48 int x2, int y2) {
David Barker15338d52017-02-13 15:30:59 +000049 int v1, v2;
50 int sum1 = 0;
51 int sum2 = 0;
52 int sumsq2 = 0;
53 int cross = 0;
54 int var2, cov;
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070055 int i, j;
56 for (i = 0; i < MATCH_SZ; ++i)
57 for (j = 0; j < MATCH_SZ; ++j) {
David Barker15338d52017-02-13 15:30:59 +000058 v1 = im1[(i + y1 - MATCH_SZ_BY2) * stride1 + (j + x1 - MATCH_SZ_BY2)];
59 v2 = im2[(i + y2 - MATCH_SZ_BY2) * stride2 + (j + x2 - MATCH_SZ_BY2)];
60 sum1 += v1;
61 sum2 += v2;
62 sumsq2 += v2 * v2;
63 cross += v1 * v2;
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070064 }
David Barker15338d52017-02-13 15:30:59 +000065 var2 = sumsq2 * MATCH_SZ_SQ - sum2 * sum2;
66 cov = cross * MATCH_SZ_SQ - sum1 * sum2;
67 return cov / sqrt((double)var2);
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070068}
69
David Barker15338d52017-02-13 15:30:59 +000070static int is_eligible_point(int pointx, int pointy, int width, int height) {
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070071 return (pointx >= MATCH_SZ_BY2 && pointy >= MATCH_SZ_BY2 &&
72 pointx + MATCH_SZ_BY2 < width && pointy + MATCH_SZ_BY2 < height);
73}
74
David Barker15338d52017-02-13 15:30:59 +000075static int is_eligible_distance(int point1x, int point1y, int point2x,
76 int point2y, int width, int height) {
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070077 const int thresh = (width < height ? height : width) >> 4;
78 return ((point1x - point2x) * (point1x - point2x) +
79 (point1y - point2y) * (point1y - point2y)) <= thresh * thresh;
80}
81
82static void improve_correspondence(unsigned char *frm, unsigned char *ref,
83 int width, int height, int frm_stride,
84 int ref_stride,
Sarah Parkerf9a961c2016-09-06 11:25:04 -070085 Correspondence *correspondences,
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070086 int num_correspondences) {
87 int i;
88 for (i = 0; i < num_correspondences; ++i) {
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070089 int x, y, best_x = 0, best_y = 0;
90 double best_match_ncc = 0.0;
91 for (y = -SEARCH_SZ_BY2; y <= SEARCH_SZ_BY2; ++y) {
92 for (x = -SEARCH_SZ_BY2; x <= SEARCH_SZ_BY2; ++x) {
93 double match_ncc;
David Barker15338d52017-02-13 15:30:59 +000094 if (!is_eligible_point(correspondences[i].rx + x,
95 correspondences[i].ry + y, width, height))
Sarah Parker4dc0f1b2016-08-09 17:40:53 -070096 continue;
David Barker15338d52017-02-13 15:30:59 +000097 if (!is_eligible_distance(correspondences[i].x, correspondences[i].y,
98 correspondences[i].rx + x,
99 correspondences[i].ry + y, width, height))
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700100 continue;
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700101 match_ncc = compute_cross_correlation(
David Barker15338d52017-02-13 15:30:59 +0000102 frm, frm_stride, correspondences[i].x, correspondences[i].y, ref,
103 ref_stride, correspondences[i].rx + x, correspondences[i].ry + y);
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700104 if (match_ncc > best_match_ncc) {
105 best_match_ncc = match_ncc;
106 best_y = y;
107 best_x = x;
108 }
109 }
110 }
David Barker15338d52017-02-13 15:30:59 +0000111 correspondences[i].rx += best_x;
112 correspondences[i].ry += best_y;
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700113 }
114 for (i = 0; i < num_correspondences; ++i) {
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700115 int x, y, best_x = 0, best_y = 0;
116 double best_match_ncc = 0.0;
117 for (y = -SEARCH_SZ_BY2; y <= SEARCH_SZ_BY2; ++y)
118 for (x = -SEARCH_SZ_BY2; x <= SEARCH_SZ_BY2; ++x) {
119 double match_ncc;
David Barker15338d52017-02-13 15:30:59 +0000120 if (!is_eligible_point(correspondences[i].x + x,
121 correspondences[i].y + y, width, height))
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700122 continue;
David Barker15338d52017-02-13 15:30:59 +0000123 if (!is_eligible_distance(
124 correspondences[i].x + x, correspondences[i].y + y,
125 correspondences[i].rx, correspondences[i].ry, width, height))
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700126 continue;
David Barker15338d52017-02-13 15:30:59 +0000127 match_ncc = compute_cross_correlation(
128 ref, ref_stride, correspondences[i].rx, correspondences[i].ry, frm,
129 frm_stride, correspondences[i].x + x, correspondences[i].y + y);
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700130 if (match_ncc > best_match_ncc) {
131 best_match_ncc = match_ncc;
132 best_y = y;
133 best_x = x;
134 }
135 }
136 correspondences[i].x += best_x;
137 correspondences[i].y += best_y;
138 }
139}
140
141int determine_correspondence(unsigned char *frm, int *frm_corners,
142 int num_frm_corners, unsigned char *ref,
143 int *ref_corners, int num_ref_corners, int width,
144 int height, int frm_stride, int ref_stride,
David Barker15338d52017-02-13 15:30:59 +0000145 int *correspondence_pts) {
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700146 // TODO(sarahparker) Improve this to include 2-way match
147 int i, j;
Sarah Parkerf9a961c2016-09-06 11:25:04 -0700148 Correspondence *correspondences = (Correspondence *)correspondence_pts;
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700149 int num_correspondences = 0;
150 for (i = 0; i < num_frm_corners; ++i) {
151 double best_match_ncc = 0.0;
152 double template_norm;
153 int best_match_j = -1;
154 if (!is_eligible_point(frm_corners[2 * i], frm_corners[2 * i + 1], width,
155 height))
156 continue;
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700157 for (j = 0; j < num_ref_corners; ++j) {
158 double match_ncc;
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700159 if (!is_eligible_point(ref_corners[2 * j], ref_corners[2 * j + 1], width,
160 height))
161 continue;
162 if (!is_eligible_distance(frm_corners[2 * i], frm_corners[2 * i + 1],
163 ref_corners[2 * j], ref_corners[2 * j + 1],
164 width, height))
165 continue;
David Barker15338d52017-02-13 15:30:59 +0000166 match_ncc = compute_cross_correlation(
167 frm, frm_stride, frm_corners[2 * i], frm_corners[2 * i + 1], ref,
168 ref_stride, ref_corners[2 * j], ref_corners[2 * j + 1]);
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700169 if (match_ncc > best_match_ncc) {
170 best_match_ncc = match_ncc;
171 best_match_j = j;
172 }
173 }
David Barker15338d52017-02-13 15:30:59 +0000174 // Note: We want to test if the best correlation is >= THRESHOLD_NCC,
175 // but need to account for the normalization in compute_cross_correlation.
176 template_norm = compute_variance(frm, frm_stride, frm_corners[2 * i],
177 frm_corners[2 * i + 1]);
178 if (best_match_ncc > THRESHOLD_NCC * sqrt(template_norm)) {
179 correspondences[num_correspondences].x = frm_corners[2 * i];
180 correspondences[num_correspondences].y = frm_corners[2 * i + 1];
181 correspondences[num_correspondences].rx = ref_corners[2 * best_match_j];
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700182 correspondences[num_correspondences].ry =
David Barker15338d52017-02-13 15:30:59 +0000183 ref_corners[2 * best_match_j + 1];
Sarah Parker4dc0f1b2016-08-09 17:40:53 -0700184 num_correspondences++;
185 }
186 }
187 improve_correspondence(frm, ref, width, height, frm_stride, ref_stride,
188 correspondences, num_correspondences);
189 return num_correspondences;
190}