taegeonum commented on a change in pull request #137: [NEMO-232] Implement InputWatermarkManager URL: https://github.com/apache/incubator-nemo/pull/137#discussion_r229897058
########## File path: runtime/executor/src/main/java/org/apache/nemo/runtime/executor/datatransfer/MultiInputWatermarkManager.java ########## @@ -0,0 +1,78 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ +package org.apache.nemo.runtime.executor.datatransfer; + +import org.apache.nemo.common.ir.vertex.OperatorVertex; +import org.apache.nemo.common.punctuation.Watermark; + +/** + * This tracks the minimum input watermark among multiple input streams. + */ +public final class MultiInputWatermarkManager implements InputWatermarkManager { + private final Watermark[] watermarks; + private final OperatorVertex nextOperator; + private int minWatermarkIndex; + public MultiInputWatermarkManager(final int numEdges, + final OperatorVertex nextOperator) { + super(); + this.watermarks = new Watermark[numEdges]; + this.nextOperator = nextOperator; + this.minWatermarkIndex = 0; + // We initialize watermarks as min value because + // we should not emit watermark until all edges emit watermarks. 
+ for (int i = 0; i < numEdges; i++) { + watermarks[i] = new Watermark(Long.MIN_VALUE); + } + } + + private int findNextMinWatermarkIndex() { + int index = -1; + long timestamp = Long.MAX_VALUE; + for (int i = 0; i < watermarks.length; i++) { + if (watermarks[i].getTimestamp() < timestamp) { + index = i; + timestamp = watermarks[i].getTimestamp(); + } + } + return index; + } + + @Override + public void trackAndEmitWatermarks(final int edgeIndex, final Watermark watermark) { + if (edgeIndex == minWatermarkIndex) { + // update min watermark + final Watermark prevMinWatermark = watermarks[minWatermarkIndex]; + watermarks[minWatermarkIndex] = watermark; + // find min watermark + minWatermarkIndex = findNextMinWatermarkIndex(); + final Watermark minWatermark = watermarks[minWatermarkIndex]; + assert minWatermark.getTimestamp() >= prevMinWatermark.getTimestamp(); Review comment: An assertion is for debugging and does not affect performance, and I think it makes the code easier to understand. Is there any reason why Nemo does not use assertions in its code? ---------------------------------------------------------------- This is an automated message from the Apache Git Service. To respond to the message, please log on GitHub and use the URL above to go to the specific comment. For queries about this service, please contact Infrastructure at: us...@infra.apache.org With regards, Apache Git Services