Github user twalthr commented on a diff in the pull request:

    https://github.com/apache/flink/pull/2562#discussion_r82133014
  
    --- Diff: 
flink-libraries/flink-table/src/test/scala/org/apache/flink/api/scala/stream/table/GroupWindowITCase.scala
 ---
    @@ -0,0 +1,777 @@
    +/*
    + * Licensed to the Apache Software Foundation (ASF) under one
    + * or more contributor license agreements.  See the NOTICE file
    + * distributed with this work for additional information
    + * regarding copyright ownership.  The ASF licenses this file
    + * to you under the Apache License, Version 2.0 (the
    + * "License"); you may not use this file except in compliance
    + * with the License.  You may obtain a copy of the License at
    + *
    + *     http://www.apache.org/licenses/LICENSE-2.0
    + *
    + * Unless required by applicable law or agreed to in writing, software
    + * distributed under the License is distributed on an "AS IS" BASIS,
    + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    + * See the License for the specific language governing permissions and
    + * limitations under the License.
    + */
    +
    +package org.apache.flink.api.scala.stream.table
    +
    +import org.apache.flink.api.scala._
    +import 
org.apache.flink.api.scala.stream.table.GroupWindowITCase.TimestampWithEqualWatermark
    +import org.apache.flink.api.scala.stream.utils.StreamITCase
    +import org.apache.flink.api.scala.table._
    +import org.apache.flink.api.table.{Row, _}
    +import org.apache.flink.streaming.api.TimeCharacteristic
    +import 
org.apache.flink.streaming.api.functions.AssignerWithPunctuatedWatermarks
    +import org.apache.flink.streaming.api.scala.StreamExecutionEnvironment
    +import org.apache.flink.streaming.api.watermark.Watermark
    +import org.apache.flink.streaming.util.StreamingMultipleProgramsTestBase
    +import org.junit.Assert._
    +import org.junit.Test
    +
    +import scala.collection.mutable
    +
    +class GroupWindowITCase extends StreamingMultipleProgramsTestBase {
    +
    +  @Test(expected = classOf[ValidationException])
    +  def testInvalidBatchWindow(): Unit = {
    +    val env = ExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    table
    +      .groupBy('string)
    +      .window(Session withGap 10.rows as 'string)
    +  }
    +
    +  @Test(expected = classOf[TableException])
    +  def testInvalidRowtime1(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'rowtime, 'int, 'string)
    +
    +    table
    +      .groupBy('string)
    +      .window(Tumble over 50.milli)
    +      .select('string, 'int.count)
    +  }
    +
    +  @Test(expected = classOf[ValidationException])
    +  def testInvalidRowtime2(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    table
    +      .groupBy('string)
    +      .window(Tumble over 50.milli)
    +      .select('string, 'int.count as 'rowtime)
    +  }
    +
    +  @Test(expected = classOf[ValidationException])
    +  def testInvalidRowtime3(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    table.as('rowtime, 'myint, 'mystring)
    +  }
    +
    +  @Test(expected = classOf[ValidationException])
    +  def testInvalidRowtime4(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    table
    +      .groupBy('string)
    +      .window(Tumble over 50.milli on 'string)
    +      .select('string, 'int.count)
    +  }
    +
    +  @Test(expected = classOf[ValidationException])
    +  def testInvalidTumblingSize(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    table
    +      .groupBy('string)
    +      .window(Tumble over "WRONG")
    +      .select('string, 'int.count)
    +  }
    +
    +  @Test(expected = classOf[ValidationException])
    +  def testInvalidSlidingSize(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    table
    +      .groupBy('string)
    +      .window(Slide over "WRONG" every "WRONG")
    +      .select('string, 'int.count)
    +  }
    +
    +  @Test(expected = classOf[ValidationException])
    +  def testInvalidSlidingSlide(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    table
    +      .groupBy('string)
    +      .window(Slide over 12.rows every "WRONG")
    +      .select('string, 'int.count)
    +  }
    +
    +  @Test(expected = classOf[ValidationException])
    +  def testInvalidSessionGap(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    table
    +      .groupBy('string)
    +      .window(Session withGap 10.rows)
    +      .select('string, 'int.count)
    +  }
    +
    +  @Test(expected = classOf[ValidationException])
    +  def testInvalidWindowAlias1(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    table
    +      .groupBy('string)
    +      .window(Session withGap 10.rows as 1 + 1)
    +      .select('string, 'int.count)
    +  }
    +
    +  @Test(expected = classOf[ValidationException])
    +  def testInvalidWindowAlias2(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    val stream = env.fromCollection(data)
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    table
    +      .groupBy('string)
    +      .window(Session withGap 10.rows as 'string)
    +      .select('string, 'int.count)
    +  }
    +
    +  @Test
    +  def testProcessingTimeTumblingGroupWindowOverTime(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    env.setStreamTimeCharacteristic(TimeCharacteristic.EventTime)
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    StreamITCase.testResults = mutable.MutableList()
    +
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    data.+=((1L, 1, "Hi"))
    +    data.+=((2L, 2, "Hello"))
    +    data.+=((4L, 2, "Hello"))
    +    data.+=((8L, 3, "Hello world"))
    +    data.+=((16L, 3, "Hello world"))
    +    val stream = env.fromCollection(data)
    +
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    val windowedTable = table
    +      .groupBy('string)
    +      .window(Tumble over 50.milli)
    +      .select('string, 'int.count)
    +
    +    // we only test if validation is successful here since processing time 
is non-deterministic
    +    windowedTable.toDataStream[Row]
    +  }
    +
    +  @Test
    +  def testProcessingTimeTumblingGroupWindowOverCount(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    env.setStreamTimeCharacteristic(TimeCharacteristic.EventTime)
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    StreamITCase.testResults = mutable.MutableList()
    +
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    data.+=((1L, 1, "Hi"))
    +    data.+=((2L, 2, "Hello"))
    +    data.+=((4L, 2, "Hello"))
    +    data.+=((8L, 3, "Hello world"))
    +    data.+=((16L, 3, "Hello world"))
    +    val stream = env.fromCollection(data)
    +
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    val windowedTable = table
    +      .groupBy('string)
    +      .window(Tumble over 2.rows)
    +      .select('string, 'int.count)
    +
    +    val results = windowedTable.toDataStream[Row]
    +    results.addSink(new StreamITCase.StringSink)
    +    env.execute()
    +
    +    val expected = Seq("Hello world,2", "Hello,2")
    +    assertEquals(expected.sorted, StreamITCase.testResults.sorted)
    +  }
    +
    +  @Test
    +  def testEventTimeTumblingGroupWindowOverTime(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    env.setStreamTimeCharacteristic(TimeCharacteristic.EventTime)
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    StreamITCase.testResults = mutable.MutableList()
    +
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    data.+=((1L, 1, "Hi"))
    +    data.+=((2L, 2, "Hello"))
    +    data.+=((4L, 2, "Hello"))
    +    data.+=((8L, 3, "Hello world"))
    +    data.+=((16L, 3, "Hello world"))
    +    val stream = env
    +      .fromCollection(data)
    +      .assignTimestampsAndWatermarks(new TimestampWithEqualWatermark())
    +
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    val windowedTable = table
    +      .groupBy('string)
    +      .window(Tumble over 5.milli on 'rowtime)
    +      .select('string, 'int.count)
    +
    +    val results = windowedTable.toDataStream[Row]
    +    results.addSink(new StreamITCase.StringSink)
    +    env.execute()
    +
    +    val expected = Seq("Hello world,1", "Hello world,1", "Hello,2", "Hi,1")
    +    assertEquals(expected.sorted, StreamITCase.testResults.sorted)
    +  }
    +
    +  @Test
    +  def testEventTimeTumblingGroupWindowOverCount(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    env.setStreamTimeCharacteristic(TimeCharacteristic.EventTime)
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    StreamITCase.testResults = mutable.MutableList()
    +
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    data.+=((1L, 1, "Hi"))
    +    data.+=((2L, 2, "Hello"))
    +    data.+=((4L, 2, "Hello"))
    +    data.+=((8L, 3, "Hello world"))
    +    data.+=((16L, 3, "Hello world"))
    +    val stream = env
    +      .fromCollection(data)
    +      .assignTimestampsAndWatermarks(new TimestampWithEqualWatermark())
    +
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    val windowedTable = table
    +      .groupBy('string)
    +      .window(Tumble over 2.rows on 'rowtime)
    +      .select('string, 'int.count)
    +
    +    val results = windowedTable.toDataStream[Row]
    +    results.addSink(new StreamITCase.StringSink)
    +    env.execute()
    +
    +    val expected = Seq("Hello world,2", "Hello,2")
    +    assertEquals(expected.sorted, StreamITCase.testResults.sorted)
    +  }
    +
    +  @Test
    +  def testProcessingTimeSlidingGroupWindowOverTime(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    env.setStreamTimeCharacteristic(TimeCharacteristic.EventTime)
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    StreamITCase.testResults = mutable.MutableList()
    +
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    data.+=((1L, 1, "Hi"))
    +    data.+=((2L, 2, "Hello"))
    +    data.+=((4L, 2, "Hello"))
    +    data.+=((8L, 3, "Hello world"))
    +    data.+=((16L, 3, "Hello world"))
    +    val stream = env.fromCollection(data)
    +
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    val windowedTable = table
    +      .groupBy('string)
    +      .window(Slide over 50.milli every 50.milli)
    +      .select('string, 'int.count)
    +
    +    // we only test if validation is successful here since processing time 
is non-deterministic
    +    windowedTable.toDataStream[Row]
    +  }
    +
    +  @Test
    +  def testProcessingTimeSlidingGroupWindowOverCount(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    env.setStreamTimeCharacteristic(TimeCharacteristic.EventTime)
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    StreamITCase.testResults = mutable.MutableList()
    +
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    data.+=((1L, 1, "Hi"))
    +    data.+=((2L, 2, "Hello"))
    +    data.+=((4L, 2, "Hello"))
    +    data.+=((8L, 3, "Hello world"))
    +    data.+=((16L, 3, "Hello world"))
    +    val stream = env.fromCollection(data)
    +
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    val windowedTable = table
    +      .groupBy('string)
    +      .window(Slide over 2.rows every 1.rows)
    +      .select('string, 'int.count)
    +
    +    val results = windowedTable.toDataStream[Row]
    +    results.addSink(new StreamITCase.StringSink)
    +    env.execute()
    +
    +    val expected = Seq("Hello world,1", "Hello world,2", "Hello,1", 
"Hello,2", "Hi,1")
    +    assertEquals(expected.sorted, StreamITCase.testResults.sorted)
    +  }
    +
    +  @Test
    +  def testEventTimeSlidingGroupWindowOverTime(): Unit = {
    +    val env = StreamExecutionEnvironment.getExecutionEnvironment
    +    env.setStreamTimeCharacteristic(TimeCharacteristic.EventTime)
    +    val tEnv = TableEnvironment.getTableEnvironment(env)
    +    StreamITCase.testResults = mutable.MutableList()
    +
    +    val data = new mutable.MutableList[(Long, Int, String)]
    +    data.+=((1L, 1, "Hi"))
    +    data.+=((2L, 2, "Hello"))
    +    data.+=((4L, 2, "Hello"))
    +    data.+=((8L, 3, "Hello world"))
    +    data.+=((16L, 3, "Hello world"))
    +    val stream = env
    +      .fromCollection(data)
    +      .assignTimestampsAndWatermarks(new TimestampWithEqualWatermark())
    +
    +    val table = stream.toTable(tEnv, 'long, 'int, 'string)
    +
    +    val windowedTable = table
    +      .groupBy('string)
    +      .window(Slide over 8.milli every 10.milli on 'rowtime)
    --- End diff --
    
    The DataStream doesn't limit that either. Maybe users want to do some 
sampling with a SlidingWindow. I wouldn't limit that.


---
If your project is set up for it, you can reply to this email and have your
reply appear on GitHub as well. If your project does not have this feature
enabled and wishes so, or if the feature is enabled but not working, please
contact infrastructure at infrastruct...@apache.org or file a JIRA ticket
with INFRA.
---

Reply via email to