AVX2 implementation for highbd_convolve_2d

Can be more than 10% faster, with bit-exact results.

Change-Id: I5f169673fd2d5af96f425f00d862f3c989228d2e
diff --git a/av1/av1_common.mk b/av1/av1_common.mk
index 5e7dca6..5d3c51e 100644
--- a/av1/av1_common.mk
+++ b/av1/av1_common.mk
@@ -167,6 +167,7 @@
 AV1_COMMON_SRCS-$(HAVE_AVX2) += common/x86/convolve_2d_avx2.c
 ifeq ($(CONFIG_HIGHBITDEPTH),yes)
 AV1_COMMON_SRCS-$(HAVE_SSSE3) += common/x86/highbd_convolve_2d_ssse3.c
+AV1_COMMON_SRCS-$(HAVE_AVX2) += common/x86/highbd_convolve_2d_avx2.c
 endif
 endif