Highbd D45E intrapred SSE2/AVX2 speedup
Function  SSE2 vs C  AVX2 vs C
4x4       ~4.5x      -
4x8       ~4.5x      -
8x4       ~11.7x     -
8x8       ~12.7x     -
8x16      ~14.0x     -
16x8      -          ~21.7x
16x16     -          ~24.0x
16x32     -          ~28.7x
32x16     -          ~20.5x
32x32     -          ~24.4x
Change-Id: Iaca49727d8df17b7f793b774a8d51a401ef8a8d1
diff --git a/aom_dsp/aom_dsp.cmake b/aom_dsp/aom_dsp.cmake
index dc8d24a..11b55ca 100644
--- a/aom_dsp/aom_dsp.cmake
+++ b/aom_dsp/aom_dsp.cmake
@@ -246,6 +246,7 @@
set(AOM_DSP_COMMON_INTRIN_AVX2
${AOM_DSP_COMMON_INTRIN_AVX2}
"${AOM_ROOT}/aom_dsp/x86/highbd_convolve_avx2.c"
+ "${AOM_ROOT}/aom_dsp/x86/highbd_intrapred_avx2.c"
"${AOM_ROOT}/aom_dsp/x86/highbd_loopfilter_avx2.c")
else ()
set(AOM_DSP_COMMON_INTRIN_DSPR2