org.apache.flink.api.java.typeutils.TupleTypeInfo.getBasicTupleTypeInfo java code examples

@Override
protected TupleTypeInfo<Tuple1<Integer>> createTypeInfo() {
  return TupleTypeInfo.getBasicTupleTypeInfo(Integer.class);
}

@Test(expected = CompositeType.InvalidFieldReferenceException.class)
@SuppressWarnings("unchecked")
public void testIllegalTupleField() {
  FieldAccessorFactory.getAccessor(TupleTypeInfo.getBasicTupleTypeInfo(Integer.class, Integer.class), 2, null);
}

@Test
public void testQuotedStringParsingWithEscapedQuotes() throws Exception {
  final String fileContent = "\"\\\"Hello\\\" World\"|\"We are\\\" young\"";
  final File tempFile = File.createTempFile("CsvReaderQuotedString", "tmp");
  tempFile.deleteOnExit();
  tempFile.setWritable(true);
  OutputStreamWriter writer = new OutputStreamWriter(new FileOutputStream(tempFile));
  writer.write(fileContent);
  writer.close();
  TupleTypeInfo<Tuple2<String, String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class, String.class);
  CsvInputFormat<Tuple2<String, String>> inputFormat = new TupleCsvInputFormat<>(new Path(tempFile.toURI().toString()), typeInfo);
  inputFormat.enableQuotedStringParsing('"');
  inputFormat.setFieldDelimiter("|");
  inputFormat.setDelimiter('\n');
  inputFormat.configure(new Configuration());
  FileInputSplit[] splits = inputFormat.createInputSplits(1);
  inputFormat.open(splits[0]);
  Tuple2<String, String> record = inputFormat.nextRecord(new Tuple2<String, String>());
  assertEquals("\\\"Hello\\\" World", record.f0);
  assertEquals("We are\\\" young", record.f1);
}

@Test
public void testQuotedStringParsingWithIncludeFields() throws Exception {
  final String fileContent = "\"20:41:52-1-3-2015\"|\"Re: Taskmanager memory error in Eclipse\"|" +
      "\"Blahblah <blah@blahblah.org>\"|\"blaaa|\"blubb\"";
  final File tempFile = File.createTempFile("CsvReaderQuotedString", "tmp");
  tempFile.deleteOnExit();
  tempFile.setWritable(true);
  OutputStreamWriter writer = new OutputStreamWriter(new FileOutputStream(tempFile));
  writer.write(fileContent);
  writer.close();
  TupleTypeInfo<Tuple2<String, String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class, String.class);
  CsvInputFormat<Tuple2<String, String>> inputFormat = new TupleCsvInputFormat<Tuple2<String, String>>(new Path(tempFile.toURI().toString()), typeInfo, new boolean[]{true, false, true});
  inputFormat.enableQuotedStringParsing('"');
  inputFormat.setFieldDelimiter("|");
  inputFormat.setDelimiter('\n');
  inputFormat.configure(new Configuration());
  FileInputSplit[] splits = inputFormat.createInputSplits(1);
  inputFormat.open(splits[0]);
  Tuple2<String, String> record = inputFormat.nextRecord(new Tuple2<String, String>());
  assertEquals("20:41:52-1-3-2015", record.f0);
  assertEquals("Blahblah <blah@blahblah.org>", record.f1);
}

wrt.close();
final TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
final CsvInputFormat<Tuple1<String>> inputFormat = new TupleCsvInputFormat<Tuple1<String>>(new Path(tempFile.toURI().toString()), typeInfo);

@Test
public void testReadSparseWithPositionSetter() throws IOException {
  try {
    final String fileContent = "111|222|333|444|555|666|777|888|999|000|\n000|999|888|777|666|555|444|333|222|111|";
    final FileInputSplit split = createTempFile(fileContent);
    final TupleTypeInfo<Tuple3<Integer, Integer, Integer>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(Integer.class, Integer.class, Integer.class);
    final CsvInputFormat<Tuple3<Integer, Integer, Integer>> format = new TupleCsvInputFormat<Tuple3<Integer, Integer, Integer>>(PATH, typeInfo, new int[]{0, 3, 7});
    format.setFieldDelimiter("|");
    format.configure(new Configuration());
    format.open(split);
    Tuple3<Integer, Integer, Integer> result = new Tuple3<Integer, Integer, Integer>();
    result = format.nextRecord(result);
    assertNotNull(result);
    assertEquals(Integer.valueOf(111), result.f0);
    assertEquals(Integer.valueOf(444), result.f1);
    assertEquals(Integer.valueOf(888), result.f2);
    result = format.nextRecord(result);
    assertNotNull(result);
    assertEquals(Integer.valueOf(000), result.f0);
    assertEquals(Integer.valueOf(777), result.f1);
    assertEquals(Integer.valueOf(333), result.f2);
    result = format.nextRecord(result);
    assertNull(result);
    assertTrue(format.reachedEnd());
  }
  catch (Exception ex) {
    fail("Test failed due to a " + ex.getClass().getName() + ": " + ex.getMessage());
  }
}

@Test
public void testReadSparseWithMask() throws IOException {
  try {
    final String fileContent = "111&&222&&333&&444&&555&&666&&777&&888&&999&&000&&\n" +
        "000&&999&&888&&777&&666&&555&&444&&333&&222&&111&&";
    final FileInputSplit split = createTempFile(fileContent);
    final TupleTypeInfo<Tuple3<Integer, Integer, Integer>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(Integer.class, Integer.class, Integer.class);
    final CsvInputFormat<Tuple3<Integer, Integer, Integer>> format = new TupleCsvInputFormat<Tuple3<Integer, Integer, Integer>>(PATH, typeInfo, new boolean[]{true, false, false, true, false, false, false, true});
    format.setFieldDelimiter("&&");
    format.configure(new Configuration());
    format.open(split);
    Tuple3<Integer, Integer, Integer> result = new Tuple3<Integer, Integer, Integer>();
    result = format.nextRecord(result);
    assertNotNull(result);
    assertEquals(Integer.valueOf(111), result.f0);
    assertEquals(Integer.valueOf(444), result.f1);
    assertEquals(Integer.valueOf(888), result.f2);
    result = format.nextRecord(result);
    assertNotNull(result);
    assertEquals(Integer.valueOf(000), result.f0);
    assertEquals(Integer.valueOf(777), result.f1);
    assertEquals(Integer.valueOf(333), result.f2);
    result = format.nextRecord(result);
    assertNull(result);
    assertTrue(format.reachedEnd());
  }
  catch (Exception ex) {
    fail("Test failed due to a " + ex.getClass().getName() + ": " + ex.getMessage());
  }
}

@Test
public void testReadSparseWithNullFieldsForTypes() throws IOException {
  try {
    final String fileContent = "111|x|222|x|333|x|444|x|555|x|666|x|777|x|888|x|999|x|000|x|\n" +
        "000|x|999|x|888|x|777|x|666|x|555|x|444|x|333|x|222|x|111|x|";
    final FileInputSplit split = createTempFile(fileContent);
    final TupleTypeInfo<Tuple3<Integer, Integer, Integer>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(Integer.class, Integer.class, Integer.class);
    final CsvInputFormat<Tuple3<Integer, Integer, Integer>> format = new TupleCsvInputFormat<Tuple3<Integer, Integer, Integer>>(PATH, typeInfo, new boolean[]{true, false, false, true, false, false, false, true});
    format.setFieldDelimiter("|x|");
    format.configure(new Configuration());
    format.open(split);
    Tuple3<Integer, Integer, Integer> result = new Tuple3<Integer, Integer, Integer>();
    result = format.nextRecord(result);
    assertNotNull(result);
    assertEquals(Integer.valueOf(111), result.f0);
    assertEquals(Integer.valueOf(444), result.f1);
    assertEquals(Integer.valueOf(888), result.f2);
    result = format.nextRecord(result);
    assertNotNull(result);
    assertEquals(Integer.valueOf(000), result.f0);
    assertEquals(Integer.valueOf(777), result.f1);
    assertEquals(Integer.valueOf(333), result.f2);
    result = format.nextRecord(result);
    assertNull(result);
    assertTrue(format.reachedEnd());
  }
  catch (Exception ex) {
    fail("Test failed due to a " + ex.getClass().getName() + ": " + ex.getMessage());
  }
}

@Test
public void testReadFirstN() throws IOException {
  try {
    final String fileContent = "111|222|333|444|555|\n666|777|888|999|000|\n";
    final FileInputSplit split = createTempFile(fileContent);
    final TupleTypeInfo<Tuple2<Integer, Integer>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(Integer.class, Integer.class);
    final CsvInputFormat<Tuple2<Integer, Integer>> format = new TupleCsvInputFormat<Tuple2<Integer, Integer>>(PATH, typeInfo);
    format.setFieldDelimiter("|");
    format.configure(new Configuration());
    format.open(split);
    Tuple2<Integer, Integer> result = new Tuple2<Integer, Integer>();
    result = format.nextRecord(result);
    assertNotNull(result);
    assertEquals(Integer.valueOf(111), result.f0);
    assertEquals(Integer.valueOf(222), result.f1);
    result = format.nextRecord(result);
    assertNotNull(result);
    assertEquals(Integer.valueOf(666), result.f0);
    assertEquals(Integer.valueOf(777), result.f1);
    result = format.nextRecord(result);
    assertNull(result);
    assertTrue(format.reachedEnd());
  }
  catch (Exception ex) {
    fail("Test failed due to a " + ex.getClass().getName() + ": " + ex.getMessage());
  }
}

/**
 * Tests cross program with replicated data source.
 */
@Test
public void checkCrossWithReplicatedSourceInput() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .cross(source2)
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
  // check the optimized Plan
  // when cross should have forward strategy on both sides
  SinkPlanNode sinkNode = oPlan.getDataSinks().iterator().next();
  DualInputPlanNode crossNode = (DualInputPlanNode) sinkNode.getPredecessor();
  ShipStrategyType crossIn1 = crossNode.getInput1().getShipStrategy();
  ShipStrategyType crossIn2 = crossNode.getInput2().getShipStrategy();
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, crossIn1);
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, crossIn2);
}

/**
 * Tests join program with replicated data source.
 */
@Test
public void checkJoinWithReplicatedSourceInput() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .join(source2).where("*").equalTo("*")
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
  // check the optimized Plan
  // when join should have forward strategy on both sides
  SinkPlanNode sinkNode = oPlan.getDataSinks().iterator().next();
  DualInputPlanNode joinNode = (DualInputPlanNode) sinkNode.getPredecessor();
  ShipStrategyType joinIn1 = joinNode.getInput1().getShipStrategy();
  ShipStrategyType joinIn2 = joinNode.getInput2().getShipStrategy();
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, joinIn1);
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, joinIn2);
}

/**
 * Tests join program with replicated data source behind map.
 */
@Test
public void checkJoinWithReplicatedSourceInputBehindMap() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .map(new IdMap())
      .join(source2).where("*").equalTo("*")
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
  // check the optimized Plan
  // when join should have forward strategy on both sides
  SinkPlanNode sinkNode = oPlan.getDataSinks().iterator().next();
  DualInputPlanNode joinNode = (DualInputPlanNode) sinkNode.getPredecessor();
  ShipStrategyType joinIn1 = joinNode.getInput1().getShipStrategy();
  ShipStrategyType joinIn2 = joinNode.getInput2().getShipStrategy();
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, joinIn1);
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, joinIn2);
}

/**
 * Tests join program with replicated data source behind flatMap.
 */
@Test
public void checkJoinWithReplicatedSourceInputBehindFlatMap() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .flatMap(new IdFlatMap())
      .join(source2).where("*").equalTo("*")
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
  // check the optimized Plan
  // when join should have forward strategy on both sides
  SinkPlanNode sinkNode = oPlan.getDataSinks().iterator().next();
  DualInputPlanNode joinNode = (DualInputPlanNode) sinkNode.getPredecessor();
  ShipStrategyType joinIn1 = joinNode.getInput1().getShipStrategy();
  ShipStrategyType joinIn2 = joinNode.getInput2().getShipStrategy();
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, joinIn1);
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, joinIn2);
}

/**
 * Tests join program with replicated data source behind map partition.
 */
@Test
public void checkJoinWithReplicatedSourceInputBehindMapPartition() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .mapPartition(new IdPMap())
      .join(source2).where("*").equalTo("*")
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
  // check the optimized Plan
  // when join should have forward strategy on both sides
  SinkPlanNode sinkNode = oPlan.getDataSinks().iterator().next();
  DualInputPlanNode joinNode = (DualInputPlanNode) sinkNode.getPredecessor();
  ShipStrategyType joinIn1 = joinNode.getInput1().getShipStrategy();
  ShipStrategyType joinIn2 = joinNode.getInput2().getShipStrategy();
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, joinIn1);
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, joinIn2);
}

/**
 * Tests join program with replicated data source behind filter.
 */
@Test
public void checkJoinWithReplicatedSourceInputBehindFilter() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .filter(new NoFilter())
      .join(source2).where("*").equalTo("*")
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
  // check the optimized Plan
  // when join should have forward strategy on both sides
  SinkPlanNode sinkNode = oPlan.getDataSinks().iterator().next();
  DualInputPlanNode joinNode = (DualInputPlanNode) sinkNode.getPredecessor();
  ShipStrategyType joinIn1 = joinNode.getInput1().getShipStrategy();
  ShipStrategyType joinIn2 = joinNode.getInput2().getShipStrategy();
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, joinIn1);
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, joinIn2);
}

/**
 * Tests cross program with replicated data source behind map and filter.
 */
@Test
public void checkCrossWithReplicatedSourceInputBehindMap() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .map(new IdMap())
      .filter(new NoFilter())
      .cross(source2)
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
  // check the optimized Plan
  // when cross should have forward strategy on both sides
  SinkPlanNode sinkNode = oPlan.getDataSinks().iterator().next();
  DualInputPlanNode crossNode = (DualInputPlanNode) sinkNode.getPredecessor();
  ShipStrategyType crossIn1 = crossNode.getInput1().getShipStrategy();
  ShipStrategyType crossIn2 = crossNode.getInput2().getShipStrategy();
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, crossIn1);
  Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, crossIn2);
}

/**
 * Tests compiler fail for join program with replicated data source and changing parallelism.
 */
@Test(expected = CompilerException.class)
public void checkJoinWithReplicatedSourceInputChangingparallelism() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .join(source2).where("*").equalTo("*").setParallelism(DEFAULT_PARALLELISM+2)
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
}

/**
 * Tests compiler fail for join program with replicated data source behind rebalance.
 */
@Test(expected = CompilerException.class)
public void checkJoinWithReplicatedSourceInputBehindRebalance() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .rebalance()
      .join(source2).where("*").equalTo("*")
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
}

/**
 * Tests compiler fail for join program with replicated data source behind reduce.
 */
@Test(expected = CompilerException.class)
public void checkJoinWithReplicatedSourceInputBehindReduce() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .reduce(new LastReduce())
      .join(source2).where("*").equalTo("*")
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
}

/**
 * Tests compiler fail for join program with replicated data source behind map and changing parallelism.
 */
@Test(expected = CompilerException.class)
public void checkJoinWithReplicatedSourceInputBehindMapChangingparallelism() {
  ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
  env.setParallelism(DEFAULT_PARALLELISM);
  TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
  ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
      new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));
  DataSet<Tuple1<String>> source1 = env.createInput(rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
  DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);
  DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
      .map(new IdMap()).setParallelism(DEFAULT_PARALLELISM+1)
      .join(source2).where("*").equalTo("*")
      .writeAsText("/some/newpath");
  Plan plan = env.createProgramPlan();
  // submit the plan to the compiler
  OptimizedPlan oPlan = compileNoStats(plan);
}

Popular methods of TupleTypeInfo

getFlatFields

Popular in Java

Start an intent from android
requestLocationUpdates (LocationManager)
onCreateOptionsMenu (Activity)
scheduleAtFixedRate (Timer)
FileNotFoundException (java.io)
Thrown when a file specified by a program cannot be found.
InetAddress (java.net)
An Internet Protocol (IP) address. This can be either an IPv4 address or an IPv6 address, and in pra
ServerSocket (java.net)
This class represents a server-side socket that waits for incoming client connections. A ServerSocke
Timestamp (java.sql)
A Java representation of the SQL TIMESTAMP type. It provides the capability of representing the SQL
TimerTask (java.util)
The TimerTask class represents a task to run at a specified time. The task may be run once or repeat
Logger (org.apache.log4j)
This is the central class in the log4j package. Most logging operations, except configuration, are d
Top Sublime Text plugins

How to use getBasicTupleTypeInfomethodin org.apache.flink.api.java.typeutils.TupleTypeInfo

Best Java code snippets using org.apache.flink.api.java.typeutils.TupleTypeInfo.getBasicTupleTypeInfo (Showing top 20 results out of 315)

How to use
getBasicTupleTypeInfo
method
in
org.apache.flink.api.java.typeutils.TupleTypeInfo