Skip to content

Commit 92cef32

Browse files
authored
Num failed inferences (#23830)
* created test_increment_num_failed_inferences and test_num_failed_inferences_no_failures
* added assertRaises to test_increment_num_failed_inferences
* added num_failed_inferences to _MetricsCollector
* changed error handling and update() implementation
* updated metric name in tests
* removed unnecessary else blocking
* removed unnecessary inference_args from test_increment_failed_batches_counter()
* changed final test_increment_failed_batches_counter assertion
* clarified error handling and updated failed_batches_counter initialization
* decreased examples array length to 1 to ensure repeatability
* troubleshooting tests
* trying to get test_increment_failed_batches_counter to fail as expected
* corrected assertion details
* simplified assertRaises and added reminder comment to assertEqual counter
* lint test
* lint test passed, resetting pre-commit-config.yaml
* fixed lingering linting issues
* shortened comment line to comply with linting
* formatter worked its magic
1 parent 2341f61 commit 92cef32

3 files changed

Lines changed: 134 additions & 41 deletions

File tree

sdks/python/apache_beam/examples/snippets/transforms/aggregation/groupby_test.py

Lines changed: 95 additions & 39 deletions
Original file line numberDiff line numberDiff line change
@@ -82,7 +82,8 @@ def test_groupby_expr(self):
8282
with beam.Pipeline() as p:
8383
grouped = (
8484
p
85-
| beam.Create(['strawberry', 'raspberry', 'blueberry', 'blackberry', 'banana'])
85+
| beam.Create(
86+
['strawberry', 'raspberry', 'blueberry', 'blackberry', 'banana'])
8687
| beam.GroupBy(lambda s: s[0]))
8788
# [END groupby_expr]
8889

@@ -101,8 +102,10 @@ def test_groupby_two_exprs(self):
101102
with beam.Pipeline() as p:
102103
grouped = (
103104
p
104-
| beam.Create(['strawberry', 'raspberry', 'blueberry', 'blackberry', 'banana'])
105-
| beam.GroupBy(letter=lambda s: s[0], is_berry=lambda s: 'berry' in s))
105+
| beam.Create(
106+
['strawberry', 'raspberry', 'blueberry', 'blackberry', 'banana'])
107+
| beam.GroupBy(
108+
letter=lambda s: s[0], is_berry=lambda s: 'berry' in s))
106109
# [END groupby_two_exprs]
107110

108111
expected = [
@@ -123,18 +126,44 @@ def test_group_by_attr(self):
123126

124127
expected = [
125128
#[START groupby_attr_result]
126-
('pie',
127-
[
128-
beam.Row(recipe='pie', fruit='strawberry', quantity=3, unit_price=1.50),
129-
beam.Row(recipe='pie', fruit='raspberry', quantity=1, unit_price=3.50),
130-
beam.Row(recipe='pie', fruit='blackberry', quantity=1, unit_price=4.00),
131-
beam.Row(recipe='pie', fruit='blueberry', quantity=1, unit_price=2.00),
132-
]),
133-
('muffin',
134-
[
135-
beam.Row(recipe='muffin', fruit='blueberry', quantity=2, unit_price=2.00),
136-
beam.Row(recipe='muffin', fruit='banana', quantity=3, unit_price=1.00),
137-
]),
129+
(
130+
'pie',
131+
[
132+
beam.Row(
133+
recipe='pie',
134+
fruit='strawberry',
135+
quantity=3,
136+
unit_price=1.50),
137+
beam.Row(
138+
recipe='pie',
139+
fruit='raspberry',
140+
quantity=1,
141+
unit_price=3.50),
142+
beam.Row(
143+
recipe='pie',
144+
fruit='blackberry',
145+
quantity=1,
146+
unit_price=4.00),
147+
beam.Row(
148+
recipe='pie',
149+
fruit='blueberry',
150+
quantity=1,
151+
unit_price=2.00),
152+
]),
153+
(
154+
'muffin',
155+
[
156+
beam.Row(
157+
recipe='muffin',
158+
fruit='blueberry',
159+
quantity=2,
160+
unit_price=2.00),
161+
beam.Row(
162+
recipe='muffin',
163+
fruit='banana',
164+
quantity=3,
165+
unit_price=1.00),
166+
]),
138167
#[END groupby_attr_result]
139168
]
140169
assert_that(grouped | beam.MapTuple(normalize_kv), equal_to(expected))
@@ -149,21 +178,48 @@ def test_group_by_attr_expr(self):
149178

150179
expected = [
151180
#[START groupby_attr_expr_result]
152-
(NamedTuple(recipe='pie', is_berry=True),
153-
[
154-
beam.Row(recipe='pie', fruit='strawberry', quantity=3, unit_price=1.50),
155-
beam.Row(recipe='pie', fruit='raspberry', quantity=1, unit_price=3.50),
156-
beam.Row(recipe='pie', fruit='blackberry', quantity=1, unit_price=4.00),
157-
beam.Row(recipe='pie', fruit='blueberry', quantity=1, unit_price=2.00),
158-
]),
159-
(NamedTuple(recipe='muffin', is_berry=True),
160-
[
161-
beam.Row(recipe='muffin', fruit='blueberry', quantity=2, unit_price=2.00),
162-
]),
163-
(NamedTuple(recipe='muffin', is_berry=False),
164-
[
165-
beam.Row(recipe='muffin', fruit='banana', quantity=3, unit_price=1.00),
166-
]),
181+
(
182+
NamedTuple(recipe='pie', is_berry=True),
183+
[
184+
beam.Row(
185+
recipe='pie',
186+
fruit='strawberry',
187+
quantity=3,
188+
unit_price=1.50),
189+
beam.Row(
190+
recipe='pie',
191+
fruit='raspberry',
192+
quantity=1,
193+
unit_price=3.50),
194+
beam.Row(
195+
recipe='pie',
196+
fruit='blackberry',
197+
quantity=1,
198+
unit_price=4.00),
199+
beam.Row(
200+
recipe='pie',
201+
fruit='blueberry',
202+
quantity=1,
203+
unit_price=2.00),
204+
]),
205+
(
206+
NamedTuple(recipe='muffin', is_berry=True),
207+
[
208+
beam.Row(
209+
recipe='muffin',
210+
fruit='blueberry',
211+
quantity=2,
212+
unit_price=2.00),
213+
]),
214+
(
215+
NamedTuple(recipe='muffin', is_berry=False),
216+
[
217+
beam.Row(
218+
recipe='muffin',
219+
fruit='banana',
220+
quantity=3,
221+
unit_price=1.00),
222+
]),
167223
#[END groupby_attr_expr_result]
168224
]
169225
assert_that(grouped | beam.MapTuple(normalize_kv), equal_to(expected))
@@ -174,8 +230,8 @@ def test_simple_aggregate(self):
174230
grouped = (
175231
p
176232
| beam.Create(GROCERY_LIST)
177-
| beam.GroupBy('fruit')
178-
.aggregate_field('quantity', sum, 'total_quantity'))
233+
| beam.GroupBy('fruit').aggregate_field(
234+
'quantity', sum, 'total_quantity'))
179235
# [END simple_aggregate]
180236

181237
expected = [
@@ -195,9 +251,9 @@ def test_expr_aggregate(self):
195251
grouped = (
196252
p
197253
| beam.Create(GROCERY_LIST)
198-
| beam.GroupBy('recipe')
199-
.aggregate_field('quantity', sum, 'total_quantity')
200-
.aggregate_field(lambda x: x.quantity * x.unit_price, sum, 'price'))
254+
| beam.GroupBy('recipe').aggregate_field(
255+
'quantity', sum, 'total_quantity').aggregate_field(
256+
lambda x: x.quantity * x.unit_price, sum, 'price'))
201257
# [END expr_aggregate]
202258

203259
expected = [
@@ -214,10 +270,10 @@ def test_global_aggregate(self):
214270
grouped = (
215271
p
216272
| beam.Create(GROCERY_LIST)
217-
| beam.GroupBy()
218-
.aggregate_field('unit_price', min, 'min_price')
219-
.aggregate_field('unit_price', MeanCombineFn(), 'mean_price')
220-
.aggregate_field('unit_price', max, 'max_price'))
273+
| beam.GroupBy().aggregate_field(
274+
'unit_price', min, 'min_price').aggregate_field(
275+
'unit_price', MeanCombineFn(), 'mean_price').aggregate_field(
276+
'unit_price', max, 'max_price'))
221277
# [END global_aggregate]
222278

223279
expected = [

sdks/python/apache_beam/ml/inference/base.py

Lines changed: 8 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -337,6 +337,8 @@ def __init__(self, namespace: str):
337337
# Metrics
338338
self._inference_counter = beam.metrics.Metrics.counter(
339339
namespace, 'num_inferences')
340+
self.failed_batches_counter = beam.metrics.Metrics.counter(
341+
namespace, 'failed_batches_counter')
340342
self._inference_request_batch_size = beam.metrics.Metrics.distribution(
341343
namespace, 'inference_request_batch_size')
342344
self._inference_request_batch_byte_size = (
@@ -426,8 +428,12 @@ def setup(self):
426428

427429
def process(self, batch, inference_args):
428430
start_time = _to_microseconds(self._clock.time_ns())
429-
result_generator = self._model_handler.run_inference(
430-
batch, self._model, inference_args)
431+
try:
432+
result_generator = self._model_handler.run_inference(
433+
batch, self._model, inference_args)
434+
except BaseException as e:
435+
self._metrics_collector.failed_batches_counter.inc()
436+
raise e
431437
predictions = list(result_generator)
432438

433439
end_time = _to_microseconds(self._clock.time_ns())

sdks/python/apache_beam/ml/inference/base_test.py

Lines changed: 31 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -175,6 +175,37 @@ def test_unexpected_inference_args_passed(self):
175175
FakeModelHandlerFailsOnInferenceArgs(),
176176
inference_args=inference_args)
177177

178+
def test_increment_failed_batches_counter(self):
179+
with self.assertRaises(ValueError):
180+
with TestPipeline() as pipeline:
181+
examples = [7]
182+
pcoll = pipeline | 'start' >> beam.Create(examples)
183+
_ = pcoll | base.RunInference(FakeModelHandlerExpectedInferenceArgs())
184+
run_result = pipeline.run()
185+
run_result.wait_until_finish()
186+
187+
metric_results = (
188+
run_result.metrics().query(
189+
MetricsFilter().with_name('failed_batches_counter')))
190+
num_failed_batches_counter = metric_results['counters'][0]
191+
self.assertEqual(num_failed_batches_counter.committed, 3)
192+
# !!!: The above will need to be updated if retry behavior changes
193+
194+
def test_failed_batches_counter_no_failures(self):
195+
pipeline = TestPipeline()
196+
examples = [7]
197+
pcoll = pipeline | 'start' >> beam.Create(examples)
198+
inference_args = {'key': True}
199+
_ = pcoll | base.RunInference(
200+
FakeModelHandlerExpectedInferenceArgs(), inference_args=inference_args)
201+
run_result = pipeline.run()
202+
run_result.wait_until_finish()
203+
204+
metric_results = (
205+
run_result.metrics().query(
206+
MetricsFilter().with_name('failed_batches_counter')))
207+
self.assertEqual(len(metric_results['counters']), 0)
208+
178209
def test_counted_metrics(self):
179210
pipeline = TestPipeline()
180211
examples = [1, 5, 3, 10]

0 commit comments

Comments (0)