@Test(expected = IndexOutOfBoundsException.class) public void testGroupByKeyFields4() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<Tuple5<Integer, Long, String, Long, Integer>> tupleDs = env.fromCollection(emptyTupleData, tupleTypeInfo); // should not work, key out of tuple bounds tupleDs.groupBy(5); }
/**
 * Runs a word count over {@code WordCountData.TEXT}: the text is tokenized with
 * {@code WordCount.Tokenizer}, grouped on tuple field 0, and tuple field 1 is summed per group.
 * The result is written into {@code resultsCollected} through a
 * {@code LocalCollectionOutputFormat}, and the job is executed under the name
 * "Word Count Collection".
 *
 * @throws Exception if building or executing the program fails
 */
@Override
protected void testProgram() throws Exception {
    ExecutionEnvironment environment = ExecutionEnvironment.getExecutionEnvironment();

    // Source text -> (word, count) pairs.
    DataSet<Tuple2<String, Integer>> tokens =
            environment.fromElements(WordCountData.TEXT).flatMap(new WordCount.Tokenizer());

    // Group on the word (field 0) and sum the counts (field 1).
    DataSet<Tuple2<String, Integer>> counts =
            tokens.groupBy(0).aggregate(Aggregations.SUM, 1);

    counts.output(new LocalCollectionOutputFormat<Tuple2<String, Integer>>(resultsCollected));
    environment.execute("Word Count Collection");
}
}
/**
 * Grouping a data set of {@code Integer} elements by the field expression
 * {@code "invalidField"} is expected to fail with an {@code InvalidProgramException}.
 */
@Test(expected = InvalidProgramException.class)
public void testGroupAtomicTypeWithInvalid2() {
    ExecutionEnvironment environment = ExecutionEnvironment.getExecutionEnvironment();
    DataSet<Integer> numbers = environment.fromElements(0, 1, 2, 3);

    // Must fail: the expression names a field on an Integer data set.
    numbers.groupBy("invalidField");
}
@Test(expected = IndexOutOfBoundsException.class) public void testGroupByKeyFields5() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<Tuple5<Integer, Long, String, Long, Integer>> tupleDs = env.fromCollection(emptyTupleData, tupleTypeInfo); // should not work, negative field position tupleDs.groupBy(-1); }
/**
 * Grouping a data set of {@code Integer} elements by the wildcard expression {@code "*"} is
 * expected to be accepted; the test passes when no exception is thrown.
 */
@Test
public void testGroupingAtomicType() {
    ExecutionEnvironment environment = ExecutionEnvironment.getExecutionEnvironment();
    DataSet<Integer> numbers = environment.fromElements(0, 1, 1, 2, 0, 0);

    // The wildcard selects the whole element as the grouping key.
    numbers.groupBy("*");
}
@Test(expected = InvalidProgramException.class) public void testGroupByKeyFields2() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<Long> longDs = env.fromCollection(emptyLongData, BasicTypeInfo.LONG_TYPE_INFO); // should not work: groups on basic type longDs.groupBy(0); }
@Test(expected = InvalidProgramException.class) public void testGroupByKeyExpressions2() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<Long> longDs = env.fromCollection(emptyLongData, BasicTypeInfo.LONG_TYPE_INFO); // should not work: groups on basic type longDs.groupBy("myInt"); }
@Test(expected = IllegalArgumentException.class) public void testGroupByKeyExpressions4() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<CustomType> ds = env.fromCollection(customTypeData); // should not work, key out of tuple bounds ds.groupBy("myNonExistent"); }
/**
 * Grouping a data set of {@code Integer} elements by the wildcard {@code "*"} combined with
 * the additional expression {@code "invalidField"} is expected to fail with an
 * {@code InvalidProgramException}.
 */
@Test(expected = InvalidProgramException.class)
public void testGroupAtomicTypeWithInvalid1() {
    ExecutionEnvironment environment = ExecutionEnvironment.getExecutionEnvironment();
    DataSet<Integer> numbers = environment.fromElements(0, 1, 2, 3);

    // Must fail: a second key expression is passed next to the wildcard.
    numbers.groupBy("*", "invalidField");
}
/**
 * Grouping a data set whose elements are {@code ArrayList<Integer>} by the wildcard expression
 * {@code "*"} is expected to fail with an {@code InvalidProgramException}.
 */
@Test(expected = InvalidProgramException.class)
public void testGroupAtomicTypeWithInvalid3() {
    ExecutionEnvironment environment = ExecutionEnvironment.getExecutionEnvironment();
    DataSet<ArrayList<Integer>> lists = environment.fromElements(new ArrayList<Integer>());

    // Must fail: the whole ArrayList element would become the grouping key.
    lists.groupBy("*");
}
@Test(expected = IllegalArgumentException.class) public void testGroupByKeyExpressions2Nested() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<CustomType> ds = env.fromCollection(customTypeData); // should not work, key out of tuple bounds ds.groupBy("nested.myNonExistent"); }
@Test(expected = InvalidProgramException.class) public void testGroupByKeyFields3() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); this.customTypeData.add(new CustomType()); DataSet<CustomType> customDs = env.fromCollection(customTypeData); // should not work: groups on custom type customDs.groupBy(0); }
/**
 * Grouping a {@code Tuple2<byte[], byte[]>} data set on field position 0 (a primitive byte
 * array) is expected to be accepted; the test passes when no exception is thrown.
 */
@Test
public void testGroupByKeyFieldsOnPrimitiveArray() {
    // Parameterized constructor call instead of a raw Tuple2, which avoids an unchecked
    // conversion when the element is added to the typed fixture list.
    this.byteArrayData.add(new Tuple2<byte[], byte[]>(new byte[]{0}, new byte[]{1}));

    final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment();
    DataSet<Tuple2<byte[], byte[]>> tupleDs = env.fromCollection(byteArrayData);

    // should work: key field 0 is a byte[]
    tupleDs.groupBy(0);
}
@Test(expected = InvalidProgramException.class) public void testGroupByKeyExpressions3() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); this.customTypeData.add(new CustomType()); DataSet<CustomType> customDs = env.fromCollection(customTypeData); // should not work: tuple selector on custom type customDs.groupBy(0); }
@Test(expected = InvalidProgramException.class) public void testGroupSortKeyFields4() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<Tuple4<Integer, Long, CustomType, Long[]>> tupleDs = env.fromCollection(tupleWithCustomData, tupleWithCustomInfo); // should not work tupleDs.groupBy(0) .sortGroup(2, Order.ASCENDING); }
@Test(expected = IndexOutOfBoundsException.class) public void testGroupSortKeyFields2() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<Tuple5<Integer, Long, String, Long, Integer>> tupleDs = env.fromCollection(emptyTupleData, tupleTypeInfo); // should not work, field index out of bounds tupleDs.groupBy(0).sortGroup(5, Order.ASCENDING); }
@Test(expected = InvalidProgramException.class) public void testGroupSortByKeyExpression6() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<Tuple4<Integer, Long, CustomType, Long[]>> tupleDs = env.fromCollection(tupleWithCustomData, tupleWithCustomInfo); // should not work tupleDs.groupBy("f0") .sortGroup("f3", Order.ASCENDING); }
@Test(expected = InvalidProgramException.class) public void testGroupSortKeyFields5() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<Tuple4<Integer, Long, CustomType, Long[]>> tupleDs = env.fromCollection(tupleWithCustomData, tupleWithCustomInfo); // should not work tupleDs.groupBy(0) .sortGroup(3, Order.ASCENDING); }
@Test public void testGroupByKeyFields1() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<Tuple5<Integer, Long, String, Long, Integer>> tupleDs = env.fromCollection(emptyTupleData, tupleTypeInfo); // should work try { tupleDs.groupBy(0); } catch (Exception e) { Assert.fail(); } }
@Test(expected = InvalidProgramException.class) public void testGroupSortByKeyExpression4() { final ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); DataSet<Tuple4<Integer, Long, CustomType, Long[]>> tupleDs = env.fromCollection(tupleWithCustomData, tupleWithCustomInfo); // should not work tupleDs.groupBy("f0") .sortGroup("f2", Order.ASCENDING); }