3 files changed +25 -4 lines changed
sdks/python/apache_beam/yaml/examples
@@ -120,7 +120,20 @@ def test_kafka_read(
120120 auto_offset_reset_config,
121121 consumer_config):
122122 """
123- ...
123+ This PTransform simulates the behavior of the ReadFromKafka transform
124+ with the RAW format by simply taking some fixed sample text data and
125+ encoding it to raw bytes.
126+
127+ Args:
128+ pcoll: The input PCollection.
129+ format: The expected format of the Kafka records (e.g. RAW).
130+ topic: The Kafka topic to read from.
131+ bootstrap_servers: The Kafka bootstrap servers to connect to.
132+ auto_offset_reset_config: Where to start reading when no offset exists.
133+ consumer_config: Additional Kafka consumer configuration.
134+
135+ Returns:
136+ A PCollection containing the sample text data in bytes.
124137 """
125138
126139 return (
@@ -131,7 +144,15 @@ def test_kafka_read(
131144 @beam.ptransform.ptransform_fn
132145 def test_run_inference(pcoll, inference_tag, model_handler):
133146 """
134- ...
147+ This PTransform simulates the behavior of the RunInference transform.
148+
149+ Args:
150+ pcoll: The input PCollection.
151+ inference_tag: The tag to use for the returned inference.
152+ model_handler: A configuration for the respective ML model handler.
153+
154+ Returns:
155+ A PCollection containing the enriched data.
135156 """
136157
137158 from apache_beam.ml.inference.base import PredictionResult
@@ -61,7 +61,7 @@ create/write to a table. See [here](
6161 https://cloud.google.com/bigquery/docs/datasets) for how to create
6262BigQuery datasets.
6363
64- Then pipeline first reads the YouTube comments .csv dataset from
64+ The pipeline first reads the YouTube comments .csv dataset from
6565GCS bucket and performs some clean-up before writing it to a Kafka
6666topic. The pipeline then reads from that Kafka topic and applies
6767 various transformation logic before `RunInference` transform performs
1616# limitations under the License.
1717#
1818
19- # Then pipeline first reads the YouTube comments .csv dataset from GCS bucket
19+ # The pipeline first reads the YouTube comments .csv dataset from GCS bucket
2020# and performs necessary clean-up before writing it to a Kafka topic.
2121# The pipeline then reads from that Kafka topic and applies various transformation
2222# logic before RunInference transform performs remote inference with the Vertex AI
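The flow described in these comments maps onto a Beam YAML pipeline roughly like the sketch below. `ReadFromKafka` and `RunInference` are real Beam YAML transform types, but the topic, server, handler type, and Vertex AI settings shown here are placeholder assumptions, not values from this PR:

```yaml
pipeline:
  transforms:
    - type: ReadFromKafka
      config:
        format: RAW
        topic: "youtube-comments"            # placeholder
        bootstrap_servers: "localhost:9092"  # placeholder
    - type: RunInference
      input: ReadFromKafka
      config:
        inference_tag: "inference"
        model_handler:
          type: VertexAIModelHandlerJSON     # assumed handler type
          config:
            endpoint_id: "0000000000"        # placeholder
            project: "my-project"            # placeholder
            location: "us-central1"          # placeholder
```

The `inference_tag` and `model_handler` fields correspond to the parameters of the mocked `test_run_inference` transform in the first file of this diff.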