org.apache.flink.optimizer.testfunctions.IdentityCoGrouper Java Examples
The following examples show how to use
org.apache.flink.optimizer.testfunctions.IdentityCoGrouper.
You can vote up the ones you like or vote down the ones you don't like,
and go to the original project or source file by following the links above each example. You may check out the related API usage on the sidebar.
Example #1
Source File: BranchingPlansCompilerTest.java From Flink-CEPplus with Apache License 2.0 | 4 votes |
@SuppressWarnings("unchecked") @Test public void testBranchEachContractType() { try { // construct the plan ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); env.setParallelism(DEFAULT_PARALLELISM); DataSet<Long> sourceA = env.generateSequence(0,1); DataSet<Long> sourceB = env.generateSequence(0,1); DataSet<Long> sourceC = env.generateSequence(0,1); DataSet<Long> map1 = sourceA.map(new IdentityMapper<Long>()).name("Map 1"); DataSet<Long> reduce1 = map1.groupBy("*").reduceGroup(new IdentityGroupReducer<Long>()).name("Reduce 1"); DataSet<Long> join1 = sourceB.union(sourceB).union(sourceC) .join(sourceC).where("*").equalTo("*") .with(new IdentityJoiner<Long>()).name("Join 1"); DataSet<Long> coGroup1 = sourceA.coGroup(sourceB).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 1"); DataSet<Long> cross1 = reduce1.cross(coGroup1) .with(new IdentityCrosser<Long>()).name("Cross 1"); DataSet<Long> coGroup2 = cross1.coGroup(cross1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 2"); DataSet<Long> coGroup3 = map1.coGroup(join1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 3"); DataSet<Long> map2 = coGroup3.map(new IdentityMapper<Long>()).name("Map 2"); DataSet<Long> coGroup4 = map2.coGroup(join1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 4"); DataSet<Long> coGroup5 = coGroup2.coGroup(coGroup1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 5"); DataSet<Long> coGroup6 = reduce1.coGroup(coGroup4).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 6"); DataSet<Long> coGroup7 = coGroup5.coGroup(coGroup6).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 7"); coGroup7.union(sourceA) .union(coGroup3) .union(coGroup4) .union(coGroup1) .output(new DiscardingOutputFormat<Long>()); Plan plan = env.createProgramPlan(); OptimizedPlan oPlan = compileNoStats(plan); JobGraphGenerator jobGen = new JobGraphGenerator(); //Compile plan to verify that no error is thrown jobGen.compileJobGraph(oPlan); } catch (Exception e) { e.printStackTrace(); Assert.fail(e.getMessage()); } }
Example #2
Source File: GroupOrderTest.java From Flink-CEPplus with Apache License 2.0 | 4 votes |
@Test public void testCoGroupWithGroupOrder() { // construct the plan ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); env.setParallelism(DEFAULT_PARALLELISM); DataSet<Tuple7<Long, Long, Long, Long, Long, Long, Long>> set1 = env.readCsvFile("/tmp/fake1.csv") .types(Long.class, Long.class, Long.class, Long.class, Long.class, Long.class, Long.class); DataSet<Tuple7<Long, Long, Long, Long, Long, Long, Long>> set2 = env.readCsvFile("/tmp/fake2.csv") .types(Long.class, Long.class, Long.class, Long.class, Long.class, Long.class, Long.class); set1.coGroup(set2).where(3,0).equalTo(6,0) .sortFirstGroup(5, Order.DESCENDING) .sortSecondGroup(1, Order.DESCENDING).sortSecondGroup(4, Order.ASCENDING) .with(new IdentityCoGrouper<Tuple7<Long, Long, Long, Long, Long, Long, Long>>()).name("CoGroup") .output(new DiscardingOutputFormat<Tuple7<Long, Long, Long, Long, Long, Long, Long>>()).name("Sink"); Plan plan = env.createProgramPlan(); OptimizedPlan oPlan; try { oPlan = compileNoStats(plan); } catch(CompilerException ce) { ce.printStackTrace(); fail("The pact compiler is unable to compile this plan correctly."); return; // silence the compiler } OptimizerPlanNodeResolver resolver = getOptimizerPlanNodeResolver(oPlan); SinkPlanNode sinkNode = resolver.getNode("Sink"); DualInputPlanNode coGroupNode = resolver.getNode("CoGroup"); // verify the strategies Assert.assertEquals(ShipStrategyType.FORWARD, sinkNode.getInput().getShipStrategy()); Assert.assertEquals(ShipStrategyType.PARTITION_HASH, coGroupNode.getInput1().getShipStrategy()); Assert.assertEquals(ShipStrategyType.PARTITION_HASH, coGroupNode.getInput2().getShipStrategy()); Channel c1 = coGroupNode.getInput1(); Channel c2 = coGroupNode.getInput2(); Assert.assertEquals(LocalStrategy.SORT, c1.getLocalStrategy()); Assert.assertEquals(LocalStrategy.SORT, c2.getLocalStrategy()); FieldList ship1 = new FieldList(3, 0); FieldList ship2 = new FieldList(6, 0); FieldList local1 = new FieldList(3, 0, 5); FieldList local2 = new FieldList(6, 0, 1, 4); Assert.assertEquals(ship1, c1.getShipStrategyKeys()); Assert.assertEquals(ship2, c2.getShipStrategyKeys()); Assert.assertEquals(local1, c1.getLocalStrategyKeys()); Assert.assertEquals(local2, c2.getLocalStrategyKeys()); Assert.assertTrue(c1.getLocalStrategySortOrder()[0] == coGroupNode.getSortOrders()[0]); Assert.assertTrue(c1.getLocalStrategySortOrder()[1] == coGroupNode.getSortOrders()[1]); Assert.assertTrue(c2.getLocalStrategySortOrder()[0] == coGroupNode.getSortOrders()[0]); Assert.assertTrue(c2.getLocalStrategySortOrder()[1] == coGroupNode.getSortOrders()[1]); // check that the local group orderings are correct Assert.assertEquals(false, c1.getLocalStrategySortOrder()[2]); Assert.assertEquals(false, c2.getLocalStrategySortOrder()[2]); Assert.assertEquals(true, c2.getLocalStrategySortOrder()[3]); }
Example #3
Source File: BranchingPlansCompilerTest.java From flink with Apache License 2.0 | 4 votes |
@SuppressWarnings("unchecked") @Test public void testBranchEachContractType() { try { // construct the plan ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); env.setParallelism(DEFAULT_PARALLELISM); DataSet<Long> sourceA = env.generateSequence(0,1); DataSet<Long> sourceB = env.generateSequence(0,1); DataSet<Long> sourceC = env.generateSequence(0,1); DataSet<Long> map1 = sourceA.map(new IdentityMapper<Long>()).name("Map 1"); DataSet<Long> reduce1 = map1.groupBy("*").reduceGroup(new IdentityGroupReducer<Long>()).name("Reduce 1"); DataSet<Long> join1 = sourceB.union(sourceB).union(sourceC) .join(sourceC).where("*").equalTo("*") .with(new IdentityJoiner<Long>()).name("Join 1"); DataSet<Long> coGroup1 = sourceA.coGroup(sourceB).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 1"); DataSet<Long> cross1 = reduce1.cross(coGroup1) .with(new IdentityCrosser<Long>()).name("Cross 1"); DataSet<Long> coGroup2 = cross1.coGroup(cross1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 2"); DataSet<Long> coGroup3 = map1.coGroup(join1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 3"); DataSet<Long> map2 = coGroup3.map(new IdentityMapper<Long>()).name("Map 2"); DataSet<Long> coGroup4 = map2.coGroup(join1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 4"); DataSet<Long> coGroup5 = coGroup2.coGroup(coGroup1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 5"); DataSet<Long> coGroup6 = reduce1.coGroup(coGroup4).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 6"); DataSet<Long> coGroup7 = coGroup5.coGroup(coGroup6).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 7"); coGroup7.union(sourceA) .union(coGroup3) .union(coGroup4) .union(coGroup1) .output(new DiscardingOutputFormat<Long>()); Plan plan = env.createProgramPlan(); OptimizedPlan oPlan = compileNoStats(plan); JobGraphGenerator jobGen = new JobGraphGenerator(); //Compile plan to verify that no error is thrown jobGen.compileJobGraph(oPlan); } catch (Exception e) { e.printStackTrace(); Assert.fail(e.getMessage()); } }
Example #4
Source File: GroupOrderTest.java From flink with Apache License 2.0 | 4 votes |
@Test public void testCoGroupWithGroupOrder() { // construct the plan ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); env.setParallelism(DEFAULT_PARALLELISM); DataSet<Tuple7<Long, Long, Long, Long, Long, Long, Long>> set1 = env.readCsvFile("/tmp/fake1.csv") .types(Long.class, Long.class, Long.class, Long.class, Long.class, Long.class, Long.class); DataSet<Tuple7<Long, Long, Long, Long, Long, Long, Long>> set2 = env.readCsvFile("/tmp/fake2.csv") .types(Long.class, Long.class, Long.class, Long.class, Long.class, Long.class, Long.class); set1.coGroup(set2).where(3,0).equalTo(6,0) .sortFirstGroup(5, Order.DESCENDING) .sortSecondGroup(1, Order.DESCENDING).sortSecondGroup(4, Order.ASCENDING) .with(new IdentityCoGrouper<Tuple7<Long, Long, Long, Long, Long, Long, Long>>()).name("CoGroup") .output(new DiscardingOutputFormat<Tuple7<Long, Long, Long, Long, Long, Long, Long>>()).name("Sink"); Plan plan = env.createProgramPlan(); OptimizedPlan oPlan; try { oPlan = compileNoStats(plan); } catch(CompilerException ce) { ce.printStackTrace(); fail("The pact compiler is unable to compile this plan correctly."); return; // silence the compiler } OptimizerPlanNodeResolver resolver = getOptimizerPlanNodeResolver(oPlan); SinkPlanNode sinkNode = resolver.getNode("Sink"); DualInputPlanNode coGroupNode = resolver.getNode("CoGroup"); // verify the strategies Assert.assertEquals(ShipStrategyType.FORWARD, sinkNode.getInput().getShipStrategy()); Assert.assertEquals(ShipStrategyType.PARTITION_HASH, coGroupNode.getInput1().getShipStrategy()); Assert.assertEquals(ShipStrategyType.PARTITION_HASH, coGroupNode.getInput2().getShipStrategy()); Channel c1 = coGroupNode.getInput1(); Channel c2 = coGroupNode.getInput2(); Assert.assertEquals(LocalStrategy.SORT, c1.getLocalStrategy()); Assert.assertEquals(LocalStrategy.SORT, c2.getLocalStrategy()); FieldList ship1 = new FieldList(3, 0); FieldList ship2 = new FieldList(6, 0); FieldList local1 = new FieldList(3, 0, 5); FieldList local2 = new FieldList(6, 0, 1, 4); Assert.assertEquals(ship1, c1.getShipStrategyKeys()); Assert.assertEquals(ship2, c2.getShipStrategyKeys()); Assert.assertEquals(local1, c1.getLocalStrategyKeys()); Assert.assertEquals(local2, c2.getLocalStrategyKeys()); Assert.assertTrue(c1.getLocalStrategySortOrder()[0] == coGroupNode.getSortOrders()[0]); Assert.assertTrue(c1.getLocalStrategySortOrder()[1] == coGroupNode.getSortOrders()[1]); Assert.assertTrue(c2.getLocalStrategySortOrder()[0] == coGroupNode.getSortOrders()[0]); Assert.assertTrue(c2.getLocalStrategySortOrder()[1] == coGroupNode.getSortOrders()[1]); // check that the local group orderings are correct Assert.assertEquals(false, c1.getLocalStrategySortOrder()[2]); Assert.assertEquals(false, c2.getLocalStrategySortOrder()[2]); Assert.assertEquals(true, c2.getLocalStrategySortOrder()[3]); }
Example #5
Source File: BranchingPlansCompilerTest.java From flink with Apache License 2.0 | 4 votes |
@SuppressWarnings("unchecked") @Test public void testBranchEachContractType() { try { // construct the plan ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); env.setParallelism(DEFAULT_PARALLELISM); DataSet<Long> sourceA = env.generateSequence(0,1); DataSet<Long> sourceB = env.generateSequence(0,1); DataSet<Long> sourceC = env.generateSequence(0,1); DataSet<Long> map1 = sourceA.map(new IdentityMapper<Long>()).name("Map 1"); DataSet<Long> reduce1 = map1.groupBy("*").reduceGroup(new IdentityGroupReducer<Long>()).name("Reduce 1"); DataSet<Long> join1 = sourceB.union(sourceB).union(sourceC) .join(sourceC).where("*").equalTo("*") .with(new IdentityJoiner<Long>()).name("Join 1"); DataSet<Long> coGroup1 = sourceA.coGroup(sourceB).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 1"); DataSet<Long> cross1 = reduce1.cross(coGroup1) .with(new IdentityCrosser<Long>()).name("Cross 1"); DataSet<Long> coGroup2 = cross1.coGroup(cross1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 2"); DataSet<Long> coGroup3 = map1.coGroup(join1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 3"); DataSet<Long> map2 = coGroup3.map(new IdentityMapper<Long>()).name("Map 2"); DataSet<Long> coGroup4 = map2.coGroup(join1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 4"); DataSet<Long> coGroup5 = coGroup2.coGroup(coGroup1).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 5"); DataSet<Long> coGroup6 = reduce1.coGroup(coGroup4).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 6"); DataSet<Long> coGroup7 = coGroup5.coGroup(coGroup6).where("*").equalTo("*") .with(new IdentityCoGrouper<Long>()).name("CoGroup 7"); coGroup7.union(sourceA) .union(coGroup3) .union(coGroup4) .union(coGroup1) .output(new DiscardingOutputFormat<Long>()); Plan plan = env.createProgramPlan(); OptimizedPlan oPlan = compileNoStats(plan); JobGraphGenerator jobGen = new JobGraphGenerator(); //Compile plan to verify that no error is thrown jobGen.compileJobGraph(oPlan); } catch (Exception e) { e.printStackTrace(); Assert.fail(e.getMessage()); } }
Example #6
Source File: GroupOrderTest.java From flink with Apache License 2.0 | 4 votes |
@Test public void testCoGroupWithGroupOrder() { // construct the plan ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment(); env.setParallelism(DEFAULT_PARALLELISM); DataSet<Tuple7<Long, Long, Long, Long, Long, Long, Long>> set1 = env.readCsvFile("/tmp/fake1.csv") .types(Long.class, Long.class, Long.class, Long.class, Long.class, Long.class, Long.class); DataSet<Tuple7<Long, Long, Long, Long, Long, Long, Long>> set2 = env.readCsvFile("/tmp/fake2.csv") .types(Long.class, Long.class, Long.class, Long.class, Long.class, Long.class, Long.class); set1.coGroup(set2).where(3,0).equalTo(6,0) .sortFirstGroup(5, Order.DESCENDING) .sortSecondGroup(1, Order.DESCENDING).sortSecondGroup(4, Order.ASCENDING) .with(new IdentityCoGrouper<Tuple7<Long, Long, Long, Long, Long, Long, Long>>()).name("CoGroup") .output(new DiscardingOutputFormat<Tuple7<Long, Long, Long, Long, Long, Long, Long>>()).name("Sink"); Plan plan = env.createProgramPlan(); OptimizedPlan oPlan; try { oPlan = compileNoStats(plan); } catch(CompilerException ce) { ce.printStackTrace(); fail("The pact compiler is unable to compile this plan correctly."); return; // silence the compiler } OptimizerPlanNodeResolver resolver = getOptimizerPlanNodeResolver(oPlan); SinkPlanNode sinkNode = resolver.getNode("Sink"); DualInputPlanNode coGroupNode = resolver.getNode("CoGroup"); // verify the strategies Assert.assertEquals(ShipStrategyType.FORWARD, sinkNode.getInput().getShipStrategy()); Assert.assertEquals(ShipStrategyType.PARTITION_HASH, coGroupNode.getInput1().getShipStrategy()); Assert.assertEquals(ShipStrategyType.PARTITION_HASH, coGroupNode.getInput2().getShipStrategy()); Channel c1 = coGroupNode.getInput1(); Channel c2 = coGroupNode.getInput2(); Assert.assertEquals(LocalStrategy.SORT, c1.getLocalStrategy()); Assert.assertEquals(LocalStrategy.SORT, c2.getLocalStrategy()); FieldList ship1 = new FieldList(3, 0); FieldList ship2 = new FieldList(6, 0); FieldList local1 = new FieldList(3, 0, 5); FieldList local2 = new FieldList(6, 0, 1, 4); Assert.assertEquals(ship1, c1.getShipStrategyKeys()); Assert.assertEquals(ship2, c2.getShipStrategyKeys()); Assert.assertEquals(local1, c1.getLocalStrategyKeys()); Assert.assertEquals(local2, c2.getLocalStrategyKeys()); Assert.assertTrue(c1.getLocalStrategySortOrder()[0] == coGroupNode.getSortOrders()[0]); Assert.assertTrue(c1.getLocalStrategySortOrder()[1] == coGroupNode.getSortOrders()[1]); Assert.assertTrue(c2.getLocalStrategySortOrder()[0] == coGroupNode.getSortOrders()[0]); Assert.assertTrue(c2.getLocalStrategySortOrder()[1] == coGroupNode.getSortOrders()[1]); // check that the local group orderings are correct Assert.assertEquals(false, c1.getLocalStrategySortOrder()[2]); Assert.assertEquals(false, c2.getLocalStrategySortOrder()[2]); Assert.assertEquals(true, c2.getLocalStrategySortOrder()[3]); }