pabloem commented on a change in pull request #10497: [BEAM-8335] Add the ReverseTestStream
URL: https://github.com/apache/beam/pull/10497#discussion_r385983264
########## File path: sdks/python/apache_beam/runners/direct/transform_evaluator.py ##########
@@ -432,6 +439,45 @@ def finish_bundle(self): self, self.bundles, [], None, {None: self._watermark}) +class PairWithTimingEvaluator(_TransformEvaluator): + """TransformEvaluator for the PairWithTiming transform. + + This transform takes an element as an input and outputs + KV(element, `TimingInfo`). Where the `TimingInfo` contains both the + processing time timestamp and watermark. + """ + def __init__( + self, + evaluation_context, + applied_ptransform, + input_committed_bundle, + side_inputs): + assert not side_inputs + super(PairWithTimingEvaluator, self).__init__( + evaluation_context, + applied_ptransform, + input_committed_bundle, + side_inputs) + + def start_bundle(self): + main_output = list(self._outputs)[0] + self.bundle = self._evaluation_context.create_bundle(main_output) + + def process_element(self, element): + watermark_manager = self._evaluation_context._watermark_manager + watermarks = watermark_manager.get_watermarks(self._applied_ptransform)
Review comment: For performance, it may be worth considering evaluating the watermark and processing time once, rather than on every element.
----------------------------------------------------------------
This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: us...@infra.apache.org
With regards, Apache Git Services