Fix intra4x4 dst buffer offset to use dst_stride, not src_stride

Change-Id: Icbd238c73323d11d60ca4da755b52c83cb11b8b5
diff --git a/av1/encoder/rdopt.c b/av1/encoder/rdopt.c
index 373af79..e139eab 100644
--- a/av1/encoder/rdopt.c
+++ b/av1/encoder/rdopt.c
@@ -2006,7 +2006,7 @@
   const int src_stride = p->src.stride;
   const int dst_stride = pd->dst.stride;
   const uint8_t *src_init = &p->src.buf[row * 4 * src_stride + col * 4];
-  uint8_t *dst_init = &pd->dst.buf[row * 4 * src_stride + col * 4];
+  uint8_t *dst_init = &pd->dst.buf[row * 4 * dst_stride + col * 4];
 #if CONFIG_CB4X4
   // TODO(jingning): This is a temporal change. The whole function should be
   // out when cb4x4 is enabled.