Improve pack bitstream multi-thread performance

This CL improves pack bitstream multi-thread performance by
accounting for setup time overhead and job dispatch time overhead,
given the number of tiles and the number of available workers.

Change-Id: I98e4b0df684e40262ce87ccde24522d98080a825
diff --git a/av1/encoder/ethread.c b/av1/encoder/ethread.c
index 3a011e9..a4fe355 100644
--- a/av1/encoder/ethread.c
+++ b/av1/encoder/ethread.c
@@ -2074,9 +2074,8 @@
     struct aom_write_bit_buffer *saved_wb, uint8_t obu_extn_header,
     const FrameHeaderInfo *fh_info, int *const largest_tile_id,
     unsigned int *max_tile_size, uint32_t *const obu_header_size,
-    uint8_t **tile_data_start) {
+    uint8_t **tile_data_start, const int num_workers) {
   MultiThreadInfo *const mt_info = &cpi->mt_info;
-  const int num_workers = mt_info->num_mod_workers[MOD_PACK_BS];
 
   PackBSParams pack_bs_params[MAX_TILES];
   uint32_t tile_size[MAX_TILES] = { 0 };