org.apache.flink.test.util.TestUtils Java Examples
The following examples show how to use
org.apache.flink.test.util.TestUtils.
You can vote up the ones you like or vote down the ones you don't like,
and go to the original project or source file by following the links above each example. You may check out the related API usage on the sidebar.
Example #1
Source File: StreamFaultToleranceTestBase.java From Flink-CEPplus with Apache License 2.0 | 6 votes |
/**
 * Runs the test program defined in {@link #testProgram(StreamExecutionEnvironment)},
 * followed by the checks in {@link #postSubmit}.
 *
 * <p>The environment is configured with parallelism {@code PARALLELISM}, a checkpoint
 * interval of 500, and a fixed-delay restart strategy with {@code Integer.MAX_VALUE}
 * attempts and no delay.
 *
 * @throws Exception declared for signature compatibility; any {@link Exception} raised
 *     inside the body is converted into an {@link AssertionError} instead
 */
@Test
public void runCheckpointedProgram() throws Exception {
    try {
        StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();
        env.setParallelism(PARALLELISM);
        env.enableCheckpointing(500);
        env.getConfig().disableSysoutLogging();
        env.setRestartStrategy(RestartStrategies.fixedDelayRestart(Integer.MAX_VALUE, 0L));

        testProgram(env);

        TestUtils.tryExecute(env, "Fault Tolerance Test");

        postSubmit();
    } catch (Exception e) {
        // Fail the test with the same message as before, but keep the original exception
        // attached as the cause so its stack trace shows up in the test report rather
        // than only on stderr.
        throw new AssertionError(e.getMessage(), e);
    }
}
Example #2
Source File: FlinkPulsarITest.java From pulsar-flink with Apache License 2.0 | 6 votes |
@Test public void testStartFromSpecific() throws Exception { String topic = newTopic(); List<MessageId> mids = sendTypedMessages(topic, SchemaType.INT32, Arrays.asList( // 0, 1, 2, 3, 4, 5, 6, 7, 8 -20, -21, -22, 1, 2, 3, 10, 11, 12), Optional.empty()); Map<String, Set<Integer>> expectedData = new HashMap<>(); expectedData.put(topic, new HashSet<>(Arrays.asList(2, 3, 10, 11, 12))); Map<String, MessageId> offset = new HashMap<>(); offset.put(topic, mids.get(3)); StreamExecutionEnvironment see = StreamExecutionEnvironment.getExecutionEnvironment(); see.getConfig().disableSysoutLogging(); see.setParallelism(1); Properties sourceProps = sourceProperties(); sourceProps.setProperty(TOPIC_SINGLE_OPTION_KEY, topic); DataStream stream = see.addSource( new FlinkPulsarRowSource(serviceUrl, adminUrl, sourceProps).setStartFromSpecificOffsets(offset)); stream.flatMap(new CheckAllMessageExist(expectedData, 5)).setParallelism(1); TestUtils.tryExecute(see, "start from specific"); }
Example #3
Source File: FlinkPulsarITest.java From pulsar-flink with Apache License 2.0 | 5 votes |
/**
 * Two-phase test: a first job writes rows from {@code MultiTopicSource} into Pulsar across
 * several fresh topics, then a second job reads all of those topics from the earliest
 * position and feeds the rows to {@code CountMessageNumberFM}.
 */
@Test
public void testProduceConsumeMultipleTopics() throws Exception {
    final int numTopic = 5;
    final int numElements = 20;

    // ---- phase 1: produce ----
    StreamExecutionEnvironment see = StreamExecutionEnvironment.getExecutionEnvironment();
    see.getConfig().disableSysoutLogging();
    see.setParallelism(1);

    List<String> topics = new ArrayList<>();
    for (int created = 0; created < numTopic; created++) {
        topics.add(newTopic());
    }

    DataStream<Row> produced = see.addSource(new MultiTopicSource(topics, numElements));
    Properties sinkProp = sinkProperties();
    produceIntoPulsar(produced, intRowWithTopicType(), sinkProp);

    see.execute("write with topics");

    // ---- phase 2: consume and count ----
    StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();
    env.getConfig().disableSysoutLogging();

    String joinedTopics = StringUtils.join(topics.toArray(), ',');
    Properties sourceProp = sourceProperties();
    sourceProp.setProperty(TOPIC_MULTI_OPTION_KEY, joinedTopics);

    DataStream<Row> consumed = env.addSource(
            new FlinkPulsarRowSource(serviceUrl, adminUrl, sourceProp).setStartFromEarliest());
    consumed.flatMap(new CountMessageNumberFM(numElements)).setParallelism(1);

    TestUtils.tryExecute(env, "count elements from topics");
}
Example #4
Source File: FlinkPulsarITest.java From pulsar-flink with Apache License 2.0 | 5 votes |
/**
 * Sends the integers 0..49 to each of three fresh topics, then reads all topics from the
 * earliest position and validates the consumed rows via {@code CheckAllMessageExist}.
 */
@Test
public void testStartFromEarliest() throws Exception {
    final int numTopic = 3;
    final List<Integer> messages =
            IntStream.range(0, 50).boxed().collect(Collectors.toList());

    Map<String, Set<Integer>> expectedData = new HashMap<>();
    List<String> topics = new ArrayList<>();

    for (int t = 0; t < numTopic; t++) {
        String current = newTopic();
        topics.add(current);
        sendTypedMessages(current, SchemaType.INT32, messages, Optional.empty());
        expectedData.put(current, new HashSet<>(messages));
    }

    StreamExecutionEnvironment see = StreamExecutionEnvironment.getExecutionEnvironment();
    see.getConfig().disableSysoutLogging();
    see.setParallelism(3);

    Properties sourceProps = sourceProperties();
    String joinedTopics = StringUtils.join(topics, ',');
    sourceProps.setProperty(TOPIC_MULTI_OPTION_KEY, joinedTopics);

    DataStream rows = see.addSource(
            new FlinkPulsarRowSource(serviceUrl, adminUrl, sourceProps).setStartFromEarliest());

    // 150 == 3 topics x 50 messages each.
    rows.flatMap(new CheckAllMessageExist(expectedData, 150)).setParallelism(1);

    TestUtils.tryExecute(see, "start from earliest");
}
Example #5
Source File: FlinkPulsarITest.java From pulsar-flink with Apache License 2.0 | 5 votes |
@Test public void testStartFromExternalSubscription() throws Exception { String topic = newTopic(); List<MessageId> mids = sendTypedMessages(topic, SchemaType.INT32, Arrays.asList( // 0, 1, 2, 3, 4, 5, 6, 7, 8 -20, -21, -22, 1, 2, 3, 10, 11, 12), Optional.empty()); String subName = "sub-1"; PulsarAdmin admin = PulsarAdmin.builder().serviceHttpUrl(adminUrl).build(); admin.topics().createSubscription(TopicName.get(topic).toString(), subName, mids.get(3)); Map<String, Set<Integer>> expectedData = new HashMap<>(); expectedData.put(topic, new HashSet<>(Arrays.asList(2, 3, 10, 11, 12))); StreamExecutionEnvironment see = StreamExecutionEnvironment.getExecutionEnvironment(); see.getConfig().disableSysoutLogging(); see.setParallelism(1); Properties sourceProps = sourceProperties(); sourceProps.setProperty(TOPIC_SINGLE_OPTION_KEY, topic); DataStream stream = see.addSource( new FlinkPulsarRowSource(serviceUrl, adminUrl, sourceProps).setStartFromSubscription(subName)); stream.flatMap(new CheckAllMessageExist(expectedData, 5)).setParallelism(1); TestUtils.tryExecute(see, "start from specific"); assertTrue(Sets.newHashSet(admin.topics().getSubscriptions(topic)).contains(subName)); admin.close(); }
Example #6
Source File: FlinkPulsarITest.java From pulsar-flink with Apache License 2.0 | 5 votes |
@Test public void testOne2OneExactlyOnce() throws Exception { String topic = newTopic(); int parallelism = 5; int numElementsPerPartition = 1000; int totalElements = parallelism * numElementsPerPartition; int failAfterElements = numElementsPerPartition / 3; List<String> allTopicNames = new ArrayList<>(); for (int i = 0; i < parallelism; i++) { allTopicNames.add(topic + "-partition-" + i); } createTopic(topic, parallelism, adminUrl); generateRandomizedIntegerSequence( StreamExecutionEnvironment.getExecutionEnvironment(), topic, parallelism, numElementsPerPartition, true); // run the topology that fails and recovers StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); env.enableCheckpointing(500); env.setParallelism(parallelism); env.setRestartStrategy(RestartStrategies.fixedDelayRestart(1, 0)); env.getConfig().disableSysoutLogging(); Properties sourceProps = sourceProperties(); sourceProps.setProperty(TOPIC_MULTI_OPTION_KEY, StringUtils.join(allTopicNames, ',')); env.addSource(new FlinkPulsarRowSource(serviceUrl, adminUrl, sourceProps).setStartFromEarliest()) .map(new PartitionValidationMapper(parallelism, 1)) .map(new FailingIdentityMapper<Row>(failAfterElements)) .addSink(new ValidatingExactlyOnceSink(totalElements)).setParallelism(1); FailingIdentityMapper.failedBefore = false; TestUtils.tryExecute(env, "one to one exactly once test"); }
Example #7
Source File: FlinkPulsarITest.java From pulsar-flink with Apache License 2.0 | 5 votes |
@Test public void testOne2MultiSource() throws Exception { String topic = newTopic(); int numPartitions = 5; int numElementsPerPartition = 1000; int totalElements = numPartitions * numElementsPerPartition; int failAfterElements = numElementsPerPartition / 3; List<String> allTopicNames = new ArrayList<>(); for (int i = 0; i < numPartitions; i++) { allTopicNames.add(topic + "-partition-" + i); } createTopic(topic, numPartitions, adminUrl); generateRandomizedIntegerSequence( StreamExecutionEnvironment.getExecutionEnvironment(), topic, numPartitions, numElementsPerPartition, true); int parallelism = 2; // run the topology that fails and recovers StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); env.enableCheckpointing(500); env.setParallelism(parallelism); env.setRestartStrategy(RestartStrategies.fixedDelayRestart(1, 0)); env.getConfig().disableSysoutLogging(); Properties sourceProps = sourceProperties(); sourceProps.setProperty(TOPIC_MULTI_OPTION_KEY, StringUtils.join(allTopicNames, ',')); env.addSource(new FlinkPulsarRowSource(serviceUrl, adminUrl, sourceProps).setStartFromEarliest()) .map(new PartitionValidationMapper(parallelism, 3)) .map(new FailingIdentityMapper<Row>(failAfterElements)) .addSink(new ValidatingExactlyOnceSink(totalElements)).setParallelism(1); FailingIdentityMapper.failedBefore = false; TestUtils.tryExecute(env, "One-source-multi-partitions exactly once test"); }
Example #8
Source File: FlinkPulsarITest.java From pulsar-flink with Apache License 2.0 | 5 votes |
@Test public void testTaskNumberGreaterThanPartitionNumber() throws Exception { String topic = newTopic(); int numPartitions = 5; int numElementsPerPartition = 1000; int totalElements = numPartitions * numElementsPerPartition; int failAfterElements = numElementsPerPartition / 3; List<String> allTopicNames = new ArrayList<>(); for (int i = 0; i < numPartitions; i++) { allTopicNames.add(topic + "-partition-" + i); } createTopic(topic, numPartitions, adminUrl); generateRandomizedIntegerSequence( StreamExecutionEnvironment.getExecutionEnvironment(), topic, numPartitions, numElementsPerPartition, true); int parallelism = 8; // run the topology that fails and recovers StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); env.enableCheckpointing(500); env.setParallelism(parallelism); env.setRestartStrategy(RestartStrategies.fixedDelayRestart(1, 0)); env.getConfig().disableSysoutLogging(); Properties sourceProps = sourceProperties(); sourceProps.setProperty(TOPIC_MULTI_OPTION_KEY, StringUtils.join(allTopicNames, ',')); env.addSource(new FlinkPulsarRowSource(serviceUrl, adminUrl, sourceProps).setStartFromEarliest()) .map(new PartitionValidationMapper(parallelism, 1)) .map(new FailingIdentityMapper<Row>(failAfterElements)) .addSink(new ValidatingExactlyOnceSink(totalElements)).setParallelism(1); FailingIdentityMapper.failedBefore = false; TestUtils.tryExecute(env, "source task number > partition number"); }
Example #9
Source File: KafkaProducerTestBase.java From Flink-CEPplus with Apache License 2.0 | 4 votes |
/** * This test sets KafkaProducer so that it will automatically flush the data and * and fails the broker to check whether flushed records since last checkpoint were not duplicated. */ protected void testExactlyOnce(boolean regularSink, int sinksCount) throws Exception { final String topic = (regularSink ? "exactlyOnceTopicRegularSink" : "exactlyTopicCustomOperator") + sinksCount; final int partition = 0; final int numElements = 1000; final int failAfterElements = 333; for (int i = 0; i < sinksCount; i++) { createTestTopic(topic + i, 1, 1); } TypeInformationSerializationSchema<Integer> schema = new TypeInformationSerializationSchema<>(BasicTypeInfo.INT_TYPE_INFO, new ExecutionConfig()); KeyedSerializationSchema<Integer> keyedSerializationSchema = new KeyedSerializationSchemaWrapper<>(schema); StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); env.enableCheckpointing(500); env.setParallelism(1); env.setRestartStrategy(RestartStrategies.fixedDelayRestart(1, 0)); env.getConfig().disableSysoutLogging(); Properties properties = new Properties(); properties.putAll(standardProps); properties.putAll(secureProps); // process exactly failAfterElements number of elements and then shutdown Kafka broker and fail application List<Integer> expectedElements = getIntegersSequence(numElements); DataStream<Integer> inputStream = env .addSource(new IntegerSource(numElements)) .map(new FailingIdentityMapper<Integer>(failAfterElements)); for (int i = 0; i < sinksCount; i++) { FlinkKafkaPartitioner<Integer> partitioner = new FlinkKafkaPartitioner<Integer>() { @Override public int partition(Integer record, byte[] key, byte[] value, String targetTopic, int[] partitions) { return partition; } }; if (regularSink) { StreamSink<Integer> kafkaSink = kafkaServer.getProducerSink(topic + i, keyedSerializationSchema, properties, partitioner); inputStream.addSink(kafkaSink.getUserFunction()); } else { kafkaServer.produceIntoKafka(inputStream, topic + i, 
keyedSerializationSchema, properties, partitioner); } } FailingIdentityMapper.failedBefore = false; TestUtils.tryExecute(env, "Exactly once test"); for (int i = 0; i < sinksCount; i++) { // assert that before failure we successfully snapshot/flushed all expected elements assertExactlyOnceForTopic( properties, topic + i, partition, expectedElements, KAFKA_READ_TIMEOUT); deleteTestTopic(topic + i); } }
Example #10
Source File: KafkaProducerTestBase.java From flink with Apache License 2.0 | 4 votes |
/** * This test sets KafkaProducer so that it will automatically flush the data and * and fails the broker to check whether flushed records since last checkpoint were not duplicated. */ protected void testExactlyOnce(boolean regularSink, int sinksCount) throws Exception { final String topic = (regularSink ? "exactlyOnceTopicRegularSink" : "exactlyTopicCustomOperator") + sinksCount; final int partition = 0; final int numElements = 1000; final int failAfterElements = 333; for (int i = 0; i < sinksCount; i++) { createTestTopic(topic + i, 1, 1); } TypeInformationSerializationSchema<Integer> schema = new TypeInformationSerializationSchema<>(BasicTypeInfo.INT_TYPE_INFO, new ExecutionConfig()); KeyedSerializationSchema<Integer> keyedSerializationSchema = new KeyedSerializationSchemaWrapper<>(schema); StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); env.enableCheckpointing(500); env.setParallelism(1); env.setRestartStrategy(RestartStrategies.fixedDelayRestart(1, 0)); env.getConfig().disableSysoutLogging(); Properties properties = new Properties(); properties.putAll(standardProps); properties.putAll(secureProps); // process exactly failAfterElements number of elements and then shutdown Kafka broker and fail application List<Integer> expectedElements = getIntegersSequence(numElements); DataStream<Integer> inputStream = env .addSource(new IntegerSource(numElements)) .map(new FailingIdentityMapper<Integer>(failAfterElements)); for (int i = 0; i < sinksCount; i++) { FlinkKafkaPartitioner<Integer> partitioner = new FlinkKafkaPartitioner<Integer>() { @Override public int partition(Integer record, byte[] key, byte[] value, String targetTopic, int[] partitions) { return partition; } }; if (regularSink) { StreamSink<Integer> kafkaSink = kafkaServer.getProducerSink(topic + i, keyedSerializationSchema, properties, partitioner); inputStream.addSink(kafkaSink.getUserFunction()); } else { kafkaServer.produceIntoKafka(inputStream, topic + i, 
keyedSerializationSchema, properties, partitioner); } } FailingIdentityMapper.failedBefore = false; TestUtils.tryExecute(env, "Exactly once test"); for (int i = 0; i < sinksCount; i++) { // assert that before failure we successfully snapshot/flushed all expected elements assertExactlyOnceForTopic( properties, topic + i, partition, expectedElements, KAFKA_READ_TIMEOUT); deleteTestTopic(topic + i); } }
Example #11
Source File: KafkaProducerTestBase.java From flink with Apache License 2.0 | 4 votes |
/** * This test sets KafkaProducer so that it will automatically flush the data and * and fails the broker to check whether flushed records since last checkpoint were not duplicated. */ protected void testExactlyOnce(boolean regularSink, int sinksCount) throws Exception { final String topic = (regularSink ? "exactlyOnceTopicRegularSink" : "exactlyTopicCustomOperator") + sinksCount; final int partition = 0; final int numElements = 1000; final int failAfterElements = 333; for (int i = 0; i < sinksCount; i++) { createTestTopic(topic + i, 1, 1); } TypeInformationSerializationSchema<Integer> schema = new TypeInformationSerializationSchema<>(BasicTypeInfo.INT_TYPE_INFO, new ExecutionConfig()); StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); env.enableCheckpointing(500); env.setParallelism(1); env.setRestartStrategy(RestartStrategies.fixedDelayRestart(1, 0)); Properties properties = new Properties(); properties.putAll(standardProps); properties.putAll(secureProps); // process exactly failAfterElements number of elements and then shutdown Kafka broker and fail application List<Integer> expectedElements = getIntegersSequence(numElements); DataStream<Integer> inputStream = env .addSource(new IntegerSource(numElements)) .map(new FailingIdentityMapper<Integer>(failAfterElements)); for (int i = 0; i < sinksCount; i++) { FlinkKafkaPartitioner<Integer> partitioner = new FlinkKafkaPartitioner<Integer>() { @Override public int partition(Integer record, byte[] key, byte[] value, String targetTopic, int[] partitions) { return partition; } }; if (regularSink) { StreamSink<Integer> kafkaSink = kafkaServer.getProducerSink(topic + i, schema, properties, partitioner); inputStream.addSink(kafkaSink.getUserFunction()); } else { kafkaServer.produceIntoKafka(inputStream, topic + i, schema, properties, partitioner); } } FailingIdentityMapper.failedBefore = false; TestUtils.tryExecute(env, "Exactly once test"); for (int i = 0; i < sinksCount; i++) { // 
assert that before failure we successfully snapshot/flushed all expected elements assertExactlyOnceForTopic( properties, topic + i, partition, expectedElements, KAFKA_READ_TIMEOUT); deleteTestTopic(topic + i); } }