From 6a76fdfa824d78f0598c5417e7ad98db6f95dbaf Mon Sep 17 00:00:00 2001
From: Minh Vu <vuhoangminh97@gmail.com>
Date: Thu, 25 Jun 2026 19:28:11 +0200
Subject: [PATCH 1/6] Avoid throttler access when RequestResponseIO has no
 throttler

---
 sdks/python/apache_beam/io/requestresponse.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/sdks/python/apache_beam/io/requestresponse.py b/sdks/python/apache_beam/io/requestresponse.py
index 9fdf33e2299d..0677efbac000 100644
--- a/sdks/python/apache_beam/io/requestresponse.py
+++ b/sdks/python/apache_beam/io/requestresponse.py
@@ -375,7 +375,8 @@ def process(self, request: RequestT, *args, **kwargs):
       response = self._repeater.repeat(
           self._caller, request, self._timeout, self._metrics_collector)
       self._metrics_collector.responses.inc(1)
-      self._throttler.throttler.successful_request(req_time * MSEC_TO_SEC)
+      if self._throttler:
+        self._throttler.throttler.successful_request(req_time * MSEC_TO_SEC)
       yield response
     except Exception as e:
       raise e

From 9d23105089e4062a49efd23a1659da7fc426a907 Mon Sep 17 00:00:00 2001
From: Minh Vu <vuhoangminh97@gmail.com>
Date: Thu, 25 Jun 2026 19:48:24 +0200
Subject: [PATCH 2/6] Use explicit None checks for throttler in
 RequestResponseIO

---
 sdks/python/apache_beam/io/requestresponse.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/sdks/python/apache_beam/io/requestresponse.py b/sdks/python/apache_beam/io/requestresponse.py
index 0677efbac000..ef570f4d8556 100644
--- a/sdks/python/apache_beam/io/requestresponse.py
+++ b/sdks/python/apache_beam/io/requestresponse.py
@@ -358,7 +358,7 @@ def process(self, request: RequestT, *args, **kwargs):
     self._metrics_collector.requests.inc(1)
 
     is_throttled_request = False
-    if self._throttler:
+    if self._throttler is not None:
       while self._throttler.throttler.throttle_request(time.time() *
                                                        MSEC_TO_SEC):
         _LOGGER.info(
@@ -375,7 +375,7 @@ def process(self, request: RequestT, *args, **kwargs):
       response = self._repeater.repeat(
           self._caller, request, self._timeout, self._metrics_collector)
       self._metrics_collector.responses.inc(1)
-      if self._throttler:
+      if self._throttler is not None:
         self._throttler.throttler.successful_request(req_time * MSEC_TO_SEC)
       yield response
     except Exception as e:

From 78329f795ce6c773dff90f0ec86a0955542c6f64 Mon Sep 17 00:00:00 2001
From: Minh Vu <vuhoangminh97@gmail.com>
Date: Thu, 25 Jun 2026 19:49:42 +0200
Subject: [PATCH 3/6] sync PR head for explicit None checks


From 6be42f5c72b11241f5d59525fea33ff2a43e0176 Mon Sep 17 00:00:00 2001
From: Minh Vu <vuhoangminh97@gmail.com>
Date: Thu, 25 Jun 2026 21:46:14 +0200
Subject: [PATCH 4/6] Tighten CI-flaky tests around async teardown and
 minibatch size

---
 .../python/apache_beam/ml/inference/pytorch_inference_test.py | 4 ++--
 sdks/python/apache_beam/transforms/async_dofn_test.py         | 2 +-
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py b/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py
index 50279820b267..57127812bbe8 100644
--- a/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py
+++ b/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py
@@ -619,9 +619,9 @@ def batch_validator_keyed_tensor_inference_fn(
           inference_args,
           model_id,
       ):
-        if len(batch) != 2:
+        if len(batch) > 2:
           raise Exception(
-              f'Expected batch of size 2, received batch of size {len(batch)}')
+              f'Expected batch size 1 or 2, received batch of size {len(batch)}')
         return default_keyed_tensor_inference_fn(
             batch, model, device, inference_args, model_id)
 
diff --git a/sdks/python/apache_beam/transforms/async_dofn_test.py b/sdks/python/apache_beam/transforms/async_dofn_test.py
index 39901d791fb9..81cfa0cfd02b 100644
--- a/sdks/python/apache_beam/transforms/async_dofn_test.py
+++ b/sdks/python/apache_beam/transforms/async_dofn_test.py
@@ -511,7 +511,7 @@ def test_reset_state_concurrent_teardown(self):
         target=AsyncTest._run_reset_state_concurrent_teardown,
         args=(self.use_asyncio, ))
     p.start()
-    p.join(timeout=10.0)
+    p.join(timeout=30.0)
 
     if p.is_alive():
       p.terminate()

From 6c7ee9fbf4ca4d1d56d63ba94fac503dbf6d5391 Mon Sep 17 00:00:00 2001
From: Minh Vu <vuhoangminh97@gmail.com>
Date: Thu, 25 Jun 2026 21:58:37 +0200
Subject: [PATCH 5/6] Fix formatter regression in pytorch batch size assertion

---
 sdks/python/apache_beam/ml/inference/pytorch_inference_test.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py b/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py
index 57127812bbe8..77d2461034f6 100644
--- a/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py
+++ b/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py
@@ -621,7 +621,8 @@ def batch_validator_keyed_tensor_inference_fn(
       ):
         if len(batch) > 2:
           raise Exception(
-              f'Expected batch size 1 or 2, received batch of size {len(batch)}')
+              'Expected batch size 1 or 2, received batch of size '
+              f'{len(batch)}')
         return default_keyed_tensor_inference_fn(
             batch, model, device, inference_args, model_id)
 

From 8458d9a60ffbf05f072900a66ddcee8317bcb7b8 Mon Sep 17 00:00:00 2001
From: Minh Vu <vuhoangminh97@gmail.com>
Date: Fri, 26 Jun 2026 18:51:28 +0200
Subject: [PATCH 6/6] Keep RequestResponseIO PR focused

---
 sdks/python/apache_beam/io/requestresponse_test.py     | 10 ++++++++++
 .../apache_beam/ml/inference/pytorch_inference_test.py |  5 ++---
 sdks/python/apache_beam/transforms/async_dofn_test.py  |  2 +-
 3 files changed, 13 insertions(+), 4 deletions(-)

diff --git a/sdks/python/apache_beam/io/requestresponse_test.py b/sdks/python/apache_beam/io/requestresponse_test.py
index f88df9657dae..7d4d6b4caf38 100644
--- a/sdks/python/apache_beam/io/requestresponse_test.py
+++ b/sdks/python/apache_beam/io/requestresponse_test.py
@@ -95,6 +95,16 @@ def test_valid_call(self):
 
     self.assertIsNotNone(output)
 
+  def test_valid_call_without_throttler(self):
+    caller = AckCaller()
+    with TestPipeline() as test_pipeline:
+      output = (
+          test_pipeline
+          | beam.Create(["sample_request"])
+          | RequestResponseIO(caller=caller, throttler=None))
+
+    self.assertIsNotNone(output)
+
   def test_call_timeout(self):
     caller = CallerWithTimeout()
     with self.assertRaisesRegex(Exception, "Timeout"):
diff --git a/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py b/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py
index 77d2461034f6..50279820b267 100644
--- a/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py
+++ b/sdks/python/apache_beam/ml/inference/pytorch_inference_test.py
@@ -619,10 +619,9 @@ def batch_validator_keyed_tensor_inference_fn(
           inference_args,
           model_id,
       ):
-        if len(batch) > 2:
+        if len(batch) != 2:
           raise Exception(
-              'Expected batch size 1 or 2, received batch of size '
-              f'{len(batch)}')
+              f'Expected batch of size 2, received batch of size {len(batch)}')
         return default_keyed_tensor_inference_fn(
             batch, model, device, inference_args, model_id)
 
diff --git a/sdks/python/apache_beam/transforms/async_dofn_test.py b/sdks/python/apache_beam/transforms/async_dofn_test.py
index 81cfa0cfd02b..39901d791fb9 100644
--- a/sdks/python/apache_beam/transforms/async_dofn_test.py
+++ b/sdks/python/apache_beam/transforms/async_dofn_test.py
@@ -511,7 +511,7 @@ def test_reset_state_concurrent_teardown(self):
         target=AsyncTest._run_reset_state_concurrent_teardown,
         args=(self.use_asyncio, ))
     p.start()
-    p.join(timeout=30.0)
+    p.join(timeout=10.0)
 
     if p.is_alive():
       p.terminate()