apache · dnamaz · Dec 6, 2025 · Dec 6, 2025 · Dec 8, 2025 · Dec 9, 2025
diff --git a/CHANGES.md b/CHANGES.md
@@ -84,6 +84,7 @@
 
 ## Bugfixes
 
+* Fixed Flink classic runner failing with "No translator known for PrimitiveUnboundedRead" when using unbounded source connectors like KinesisIO after SDF-to-primitive-read conversion (Java) ([#37035](https://github.com/apache/beam/issues/37035)).
 * Fixed FirestoreV1 Beam connectors allow configuring inconsistent project/database IDs between RPC requests and routing headers #36895 (Java) ([#36895](https://github.com/apache/beam/issues/36895)).
  Logical type and coder registry are saved for pipelines in the case of default pickler. This fixes a side effect of switching to cloudpickle as default pickler in Beam 2.65.0 (Python) ([#35738](https://github.com/apache/beam/issues/35738)).
 

diff --git a/...flink/src/main/java/org/apache/beam/runners/flink/FlinkStreamingTransformTranslators.java b/...flink/src/main/java/org/apache/beam/runners/flink/FlinkStreamingTransformTranslators.java
@@ -97,6 +97,7 @@
 import org.apache.beam.sdk.values.WindowingStrategy;
 import org.apache.beam.vendor.guava.v32_1_2_jre.com.google.common.annotations.VisibleForTesting;
 import org.apache.beam.vendor.guava.v32_1_2_jre.com.google.common.collect.ImmutableMap;
+import org.apache.beam.vendor.guava.v32_1_2_jre.com.google.common.collect.Iterables;
 import org.apache.beam.vendor.guava.v32_1_2_jre.com.google.common.collect.Maps;
 import org.apache.flink.api.common.eventtime.WatermarkStrategy;
 import org.apache.flink.api.common.functions.FlatMapFunction;
@@ -174,6 +175,14 @@ class FlinkStreamingTransformTranslators {
 
   public static FlinkStreamingPipelineTranslator.StreamTransformTranslator<?> getTranslator(
       PTransform<?, ?> transform) {
+    // Handle PrimitiveUnboundedRead explicitly (created by SplittableParDo conversion)
+    if (transform instanceof SplittableParDo.PrimitiveUnboundedRead) {
+      return new PrimitiveUnboundedReadTranslator<>();
+    }
+    // Handle PrimitiveBoundedRead explicitly
+    if (transform instanceof SplittableParDo.PrimitiveBoundedRead) {
+      return new PrimitiveBoundedReadTranslator<>();
+    }
     @Nullable String urn = PTransformTranslation.urnForTransformOrNull(transform);
     return urn == null ? null : TRANSLATORS.get(urn);
   }
@@ -183,33 +192,131 @@ public static String getCurrentTransformName(FlinkStreamingTranslationContext co
     return context.getCurrentTransform().getFullName();
   }
 
+  /** Returns the parallelism to use for source operators. */
+  private static int getSourceParallelism(FlinkStreamingTranslationContext context) {
+    int maxParallelism = context.getExecutionEnvironment().getMaxParallelism();
+    return maxParallelism > 0 ? maxParallelism : context.getExecutionEnvironment().getParallelism();
+  }
+
   // --------------------------------------------------------------------------------------------
   //  Transformation Implementations
   // --------------------------------------------------------------------------------------------
 
+  /** Common translation logic for unbounded sources. */
+  @SuppressWarnings("unchecked")
+  private static <T> void translateUnboundedSource(
+      UnboundedSource<T, ?> rawSource,
+      String transformName,
+      FlinkStreamingTranslationContext context) {
+
+    PCollection<T> output =
+        (PCollection<T>)
+            Iterables.getOnlyElement(context.getCurrentTransform().getOutputs().values());
+
+    DataStream<WindowedValue<T>> source;
+    DataStream<WindowedValue<ValueWithRecordId<T>>> nonDedupSource;
+    TypeInformation<WindowedValue<T>> outputTypeInfo = context.getTypeInfo(output);
+
+    Coder<T> coder = output.getCoder();
+
+    TypeInformation<WindowedValue<ValueWithRecordId<T>>> withIdTypeInfo =
+        new CoderTypeInformation<>(
+            WindowedValues.getFullCoder(
+                ValueWithRecordId.ValueWithRecordIdCoder.of(coder),
+                output.getWindowingStrategy().getWindowFn().windowCoder()),
+            context.getPipelineOptions());
+
+    String fullName = getCurrentTransformName(context);
+    try {
+      int parallelism = getSourceParallelism(context);
+
+      FlinkUnboundedSource<T> unboundedSource =
+          FlinkSource.unbounded(
+              transformName,
+              rawSource,
+              new SerializablePipelineOptions(context.getPipelineOptions()),
+              parallelism);
+      nonDedupSource =
+          context
+              .getExecutionEnvironment()
+              .fromSource(
+                  unboundedSource, WatermarkStrategy.noWatermarks(), fullName, withIdTypeInfo)
+              .uid(fullName);
+
+      if (rawSource.requiresDeduping()) {
+        source =
+            nonDedupSource
+                .keyBy(new ValueWithRecordIdKeySelector<>())
+                .transform(
+                    "deduping",
+                    outputTypeInfo,
+                    new DedupingOperator<>(context.getPipelineOptions()))
+                .uid(format("%s/__deduplicated__", fullName));
+      } else {
+        source =
+            nonDedupSource
+                .flatMap(new StripIdsMap<>(context.getPipelineOptions()))
+                .returns(outputTypeInfo);
+      }
+    } catch (Exception e) {
+      throw new RuntimeException("Error while translating UnboundedSource: " + rawSource, e);
+    }
+
+    context.setOutputDataStream(output, source);
+  }
+
+  /** Common translation logic for bounded sources. */
+  @SuppressWarnings("unchecked")
+  private static <T> void translateBoundedSource(
+      BoundedSource<T> rawSource, String transformName, FlinkStreamingTranslationContext context) {
+
+    PCollection<T> output =
+        (PCollection<T>)
+            Iterables.getOnlyElement(context.getCurrentTransform().getOutputs().values());
+
+    TypeInformation<WindowedValue<T>> outputTypeInfo = context.getTypeInfo(output);
+
+    String fullName = getCurrentTransformName(context);
+    int parallelism = getSourceParallelism(context);
+
+    FlinkBoundedSource<T> flinkBoundedSource =
+        FlinkSource.bounded(
+            transformName,
+            rawSource,
+            new SerializablePipelineOptions(context.getPipelineOptions()),
+            parallelism);
+
+    SingleOutputStreamOperator<WindowedValue<T>> source;
+    try {
+      source =
+          context
+              .getExecutionEnvironment()
+              .fromSource(
+                  flinkBoundedSource, WatermarkStrategy.noWatermarks(), fullName, outputTypeInfo)
+              .uid(fullName)
+              .returns(outputTypeInfo);
+
+      if (!context.isStreaming()
+          && context
+              .getPipelineOptions()
+              .as(FlinkPipelineOptions.class)
+              .getForceSlotSharingGroup()) {
+        source = source.slotSharingGroup(FORCED_SLOT_GROUP);
+      }
+    } catch (Exception e) {
+      throw new RuntimeException("Error while translating BoundedSource: " + rawSource, e);
+    }
+
+    context.setOutputDataStream(output, source);
+  }
+
   private static class UnboundedReadSourceTranslator<T>
       extends FlinkStreamingPipelineTranslator.StreamTransformTranslator<
           PTransform<PBegin, PCollection<T>>> {
 
     @Override
     public void translateNode(
         PTransform<PBegin, PCollection<T>> transform, FlinkStreamingTranslationContext context) {
-      PCollection<T> output = context.getOutput(transform);
-
-      DataStream<WindowedValue<T>> source;
-      DataStream<WindowedValue<ValueWithRecordId<T>>> nonDedupSource;
-      TypeInformation<WindowedValue<T>> outputTypeInfo =
-          context.getTypeInfo(context.getOutput(transform));
-
-      Coder<T> coder = context.getOutput(transform).getCoder();
-
-      TypeInformation<WindowedValue<ValueWithRecordId<T>>> withIdTypeInfo =
-          new CoderTypeInformation<>(
-              WindowedValues.getFullCoder(
-                  ValueWithRecordId.ValueWithRecordIdCoder.of(coder),
-                  output.getWindowingStrategy().getWindowFn().windowCoder()),
-              context.getPipelineOptions());
-
       UnboundedSource<T, ?> rawSource;
       try {
         rawSource =
@@ -219,47 +326,43 @@ public void translateNode(
       } catch (IOException e) {
         throw new RuntimeException(e);
       }
+      translateUnboundedSource(rawSource, transform.getName(), context);
+    }
+  }
 
-      String fullName = getCurrentTransformName(context);
-      try {
-        int parallelism =
-            context.getExecutionEnvironment().getMaxParallelism() > 0
-                ? context.getExecutionEnvironment().getMaxParallelism()
-                : context.getExecutionEnvironment().getParallelism();
-
-        FlinkUnboundedSource<T> unboundedSource =
-            FlinkSource.unbounded(
-                transform.getName(),
-                rawSource,
-                new SerializablePipelineOptions(context.getPipelineOptions()),
-                parallelism);
-        nonDedupSource =
-            context
-                .getExecutionEnvironment()
-                .fromSource(
-                    unboundedSource, WatermarkStrategy.noWatermarks(), fullName, withIdTypeInfo)
-                .uid(fullName);
+  /**
+   * Translator for {@link SplittableParDo.PrimitiveUnboundedRead}.
+   *
+   * <p>This handles the case where Read.Unbounded is converted to PrimitiveUnboundedRead by {@link
+   * SplittableParDo#convertReadBasedSplittableDoFnsToPrimitiveReadsIfNecessary}.
+   */
+  private static class PrimitiveUnboundedReadTranslator<T>
+      extends FlinkStreamingPipelineTranslator.StreamTransformTranslator<
+          SplittableParDo.PrimitiveUnboundedRead<T>> {
 
-        if (rawSource.requiresDeduping()) {
-          source =
-              nonDedupSource
-                  .keyBy(new ValueWithRecordIdKeySelector<>())
-                  .transform(
-                      "deduping",
-                      outputTypeInfo,
-                      new DedupingOperator<>(context.getPipelineOptions()))
-                  .uid(format("%s/__deduplicated__", fullName));
-        } else {
-          source =
-              nonDedupSource
-                  .flatMap(new StripIdsMap<>(context.getPipelineOptions()))
-                  .returns(outputTypeInfo);
-        }
-      } catch (Exception e) {
-        throw new RuntimeException("Error while translating UnboundedSource: " + rawSource, e);
-      }
+    @Override
+    public void translateNode(
+        SplittableParDo.PrimitiveUnboundedRead<T> transform,
+        FlinkStreamingTranslationContext context) {
+      translateUnboundedSource(transform.getSource(), transform.getName(), context);
+    }
+  }
+
+  /**
+   * Translator for {@link SplittableParDo.PrimitiveBoundedRead}.
+   *
+   * <p>This handles the case where Read.Bounded is converted to PrimitiveBoundedRead by {@link
+   * SplittableParDo#convertReadBasedSplittableDoFnsToPrimitiveReadsIfNecessary}.
+   */
+  private static class PrimitiveBoundedReadTranslator<T>
+      extends FlinkStreamingPipelineTranslator.StreamTransformTranslator<
+          SplittableParDo.PrimitiveBoundedRead<T>> {
 
-      context.setOutputDataStream(output, source);
+    @Override
+    public void translateNode(
+        SplittableParDo.PrimitiveBoundedRead<T> transform,
+        FlinkStreamingTranslationContext context) {
+      translateBoundedSource(transform.getSource(), transform.getName(), context);
     }
   }
 
@@ -372,11 +475,6 @@ private static class BoundedReadSourceTranslator<T>
     @Override
     public void translateNode(
         PTransform<PBegin, PCollection<T>> transform, FlinkStreamingTranslationContext context) {
-      PCollection<T> output = context.getOutput(transform);
-
-      TypeInformation<WindowedValue<T>> outputTypeInfo =
-          context.getTypeInfo(context.getOutput(transform));
-
       BoundedSource<T> rawSource;
       try {
         rawSource =
@@ -386,43 +484,7 @@ public void translateNode(
       } catch (IOException e) {
         throw new RuntimeException(e);
       }
-
-      String fullName = getCurrentTransformName(context);
-      int parallelism =
-          context.getExecutionEnvironment().getMaxParallelism() > 0
-              ? context.getExecutionEnvironment().getMaxParallelism()
-              : context.getExecutionEnvironment().getParallelism();
-
-      FlinkBoundedSource<T> flinkBoundedSource =
-          FlinkSource.bounded(
-              transform.getName(),
-              rawSource,
-              new SerializablePipelineOptions(context.getPipelineOptions()),
-              parallelism);
-
-      TypeInformation<WindowedValue<T>> typeInfo = context.getTypeInfo(output);
-
-      SingleOutputStreamOperator<WindowedValue<T>> source;
-      try {
-        source =
-            context
-                .getExecutionEnvironment()
-                .fromSource(
-                    flinkBoundedSource, WatermarkStrategy.noWatermarks(), fullName, outputTypeInfo)
-                .uid(fullName)
-                .returns(typeInfo);
-
-        if (!context.isStreaming()
-            && context
-                .getPipelineOptions()
-                .as(FlinkPipelineOptions.class)
-                .getForceSlotSharingGroup()) {
-          source = source.slotSharingGroup(FORCED_SLOT_GROUP);
-        }
-      } catch (Exception e) {
-        throw new RuntimeException("Error while translating BoundedSource: " + rawSource, e);
-      }
-      context.setOutputDataStream(output, source);
+      translateBoundedSource(rawSource, transform.getName(), context);
     }
   }