getsentry · untitaker · Aug 31, 2023 · Jun 29, 2023 · Jun 29, 2023 · Jun 29, 2023
@@ -309,6 +309,21 @@ class RunTaskWithMultiprocessing(
         ``arroyo.strategies.run_task_with_multiprocessing.batch.output.overflow``
         metric is incremented.
 
+    :param resize_input_blocks: Experimental feature, whether input blocks
+        should be dynamically resized if they end up being too small for batches.
+        This can technically cause unbounded memory consumption, so it is
+        recommended to also configure ``max_input_block_size`` if this option
+        is used.
+
+    :param resize_output_blocks: Experimental feature, same as
+        ``resize_input_blocks`` but for the output blocks.
+
+    :param max_input_block_size: If ``resize_input_blocks`` is enabled, this
+        sets an upper limit on how large those blocks can get. If unset, input
+        blocks can grow without limit.
+
+    :param max_output_block_size: Same as ``max_input_block_size`` but for
+        output blocks.
+
     :param initializer: A function to run at the beginning of each subprocess.
 
         Subprocesses are spawned without any of the state of the parent
@@ -413,13 +428,22 @@ def __init__(
         max_batch_time: float,
         input_block_size: int,
         output_block_size: int,
+        resize_input_blocks: bool = False,
+        resize_output_blocks: bool = False,
+        max_input_block_size: Optional[int] = None,
+        max_output_block_size: Optional[int] = None,
         initializer: Optional[Callable[[], None]] = None,
     ) -> None:
         self.__transform_function = function
         self.__next_step = next_step
         self.__max_batch_size = max_batch_size
         self.__max_batch_time = max_batch_time
 
+        self.__resize_input_blocks = resize_input_blocks
+        self.__resize_output_blocks = resize_output_blocks
+        self.__max_input_block_size = max_input_block_size
+        self.__max_output_block_size = max_output_block_size
+
         self.__shared_memory_manager = SharedMemoryManager()
         self.__shared_memory_manager.start()
 
@@ -454,6 +478,8 @@ def __init__(
                     ]
                 ],
                 AsyncResult[ParallelRunTaskResult[TResult]],
+                bool,  # was the input block too small?
+                bool,  # was the output block too small?
             ]
         ] = deque()
         self.__invalid_messages = InvalidMessageState()
@@ -481,7 +507,7 @@ def handle_sigchld(signum: int, frame: Any) -> None:
 
         signal.signal(signal.SIGCHLD, handle_sigchld)
 
-    def __submit_batch(self) -> None:
+    def __submit_batch(self, input_block_too_small: bool) -> None:
         assert self.__batch_builder is not None
         batch = self.__batch_builder.build()
         logger.debug("Submitting %r to %r...", batch, self.__pool)
@@ -492,6 +518,8 @@ def __submit_batch(self) -> None:
                     parallel_run_task_worker_apply,
                     (self.__transform_function, batch, self.__output_blocks.pop()),
                 ),
+                input_block_too_small,
+                False,
             )
         )
         self.__batches_in_progress.increment()
@@ -547,7 +575,12 @@ def __check_for_results(self, timeout: Optional[float] = None) -> None:
                 self.__pool_waiting_time = None
 
     def __check_for_results_impl(self, timeout: Optional[float] = None) -> None:
-        input_batch, async_result = self.__processes[0]
+        (
+            input_batch,
+            async_result,
+            input_block_too_small,
+            output_block_too_small,
+        ) = self.__processes[0]
 
         # If this call is being made in a context where it is intended to be
         # nonblocking, checking if the result is ready (rather than trying to
@@ -559,6 +592,15 @@ def __check_for_results_impl(self, timeout: Optional[float] = None) -> None:
 
         result = async_result.get(timeout=timeout)
 
+        self.__metrics.timing(
+            "arroyo.strategies.run_task_with_multiprocessing.output_batch.size.msg",
+            len(result.valid_messages_transformed),
+        )
+        self.__metrics.timing(
+            "arroyo.strategies.run_task_with_multiprocessing.output_batch.size.bytes",
+            result.valid_messages_transformed.get_content_size(),
+        )
+
         for idx, message in result.valid_messages_transformed:
             if isinstance(message, InvalidMessage):
                 # For the next invocation of __check_for_results, skip over this message
@@ -604,12 +646,54 @@ def __check_for_results_impl(self, timeout: Optional[float] = None) -> None:
                         result.next_index_to_process,
                     ),
                 ),
+                input_block_too_small,
+                True,
             )
             return
 
+        old_input_block = input_batch.block
+
+        if (
+            input_block_too_small
+            and self.__resize_input_blocks
+            and (
+                self.__max_input_block_size is None
+                or self.__max_input_block_size > old_input_block.size * 2
+            )
+        ):
+            self.__metrics.increment(
+                "arroyo.strategies.run_task_with_multiprocessing.batch.input.resize"
+            )
+            new_input_block = self.__shared_memory_manager.SharedMemory(
+                old_input_block.size * 2
+            )
+            old_input_block.unlink()
+        else:
+            new_input_block = old_input_block
+
+        old_output_block = result.valid_messages_transformed.block
+
+        if (
+            output_block_too_small
+            and self.__resize_output_blocks
+            and (
+                self.__max_output_block_size is None
+                or self.__max_output_block_size > old_output_block.size * 2
+            )
+        ):
+            self.__metrics.increment(
+                "arroyo.strategies.run_task_with_multiprocessing.batch.output.resize"
+            )
+            new_output_block = self.__shared_memory_manager.SharedMemory(
+                old_output_block.size * 2
+            )
+            old_output_block.unlink()
+        else:
+            new_output_block = old_output_block
+
         logger.debug("Completed %r, reclaiming blocks...", input_batch)
-        self.__input_blocks.append(input_batch.block)
-        self.__output_blocks.append(result.valid_messages_transformed.block)
+        self.__input_blocks.append(new_input_block)
+        self.__output_blocks.append(new_output_block)
         self.__batches_in_progress.decrement()
 
         del self.__processes[0]
@@ -621,7 +705,7 @@ def poll(self) -> None:
         self.__check_for_results(timeout=0)
 
         if self.__batch_builder is not None and self.__batch_builder.ready():
-            self.__submit_batch()
+            self.__submit_batch(False)
 
     def __reset_batch_builder(self) -> None:
         try:
@@ -651,7 +735,7 @@ def submit(
             self.__metrics.increment(
                 "arroyo.strategies.run_task_with_multiprocessing.batch.input.overflow"
             )
-            self.__submit_batch()
+            self.__submit_batch(True)
 
             # This may raise ``MessageRejected`` (if all of the shared memory
             # is in use) and create backpressure.
@@ -667,7 +751,7 @@ def close(self) -> None:
         self.__closed = True
 
         if self.__batch_builder is not None and len(self.__batch_builder) > 0:
-            self.__submit_batch()
+            self.__submit_batch(False)
 
     def terminate(self) -> None:
         self.__closed = True

@@ -5,6 +5,10 @@
     "arroyo.strategies.run_task_with_multiprocessing.batch.size.msg",
     # Number of bytes in a multiprocessing batch
     "arroyo.strategies.run_task_with_multiprocessing.batch.size.bytes",
+    # Number of messages in a multiprocessing batch after the message transformation
+    "arroyo.strategies.run_task_with_multiprocessing.output_batch.size.msg",
+    # Number of bytes in a multiprocessing batch after the message transformation
+    "arroyo.strategies.run_task_with_multiprocessing.output_batch.size.bytes",
     # Number of times the consumer is spinning
     "arroyo.consumer.run.count",
     # How long it took the Reduce step to fill up a batch
@@ -22,6 +26,14 @@
     # This can be devastating for throughput. Increase `output_block_size` to
     # fix.
     "arroyo.strategies.run_task_with_multiprocessing.batch.output.overflow",
+    # Arroyo has decided to re-allocate a block in order to combat input buffer
+    # overflow. This can be enabled or disabled using the `resize_input_blocks`
+    # setting.
+    "arroyo.strategies.run_task_with_multiprocessing.batch.input.resize",
+    # Arroyo has decided to re-allocate a block in order to combat output buffer
+    # overflow. This can be enabled or disabled using the `resize_output_blocks`
+    # setting.
+    "arroyo.strategies.run_task_with_multiprocessing.batch.output.resize",
     # How many batches are being processed in parallel by multiprocessing.
     "arroyo.strategies.run_task_with_multiprocessing.batches_in_progress",
     # Counter. A subprocess by multiprocessing unexpectedly died.