private static StreamExecutionEnvironment getSimpleJob() {
    StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();
    env.generateSequence(1, 10000000)
        .addSink(new SinkFunction<Long>() {
            @Override
            public void invoke(Long value) {
            }
        });
    return env;
}
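// Hypothetical driver for the helper above (not part of the original snippet):
// getSimpleJob() only builds the topology; execute() is what actually runs it.
public static void main(String[] args) throws Exception {
    getSimpleJob().execute("simple sequence job");
}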
@SuppressWarnings("unchecked") private static <T> SourceFunction<T> getFunctionFromDataSource(DataStreamSource<T> dataStreamSource) { dataStreamSource.addSink(new DiscardingSink<T>()); AbstractUdfStreamOperator<?, ?> operator = (AbstractUdfStreamOperator<?, ?>) getOperatorFromDataStream(dataStreamSource); return (SourceFunction<T>) operator.getUserFunction(); }
public static void main(String[] args) throws Exception {
    final ParameterTool params = ParameterTool.fromArgs(args);
    double errorRate = params.getDouble("error-rate", 0.0);
    int sleep = params.getInt("sleep", 1);

    String kafkaTopic = params.get("kafka-topic");
    String brokers = params.get("brokers", "localhost:9092");

    System.out.printf("Generating events to Kafka with standalone source with error rate %f and sleep delay %s millis\n", errorRate, sleep);
    System.out.println();

    final StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();

    env
        .addSource(new EventsGeneratorSource(errorRate, sleep))
        .addSink(new FlinkKafkaProducer010<>(brokers, kafkaTopic, new EventDeSerializer()));

    // trigger program execution
    env.execute("State machine example Kafka events generator job");
}
consuming.addSink(new DiscardingSink<String>());
@Override
public void go() throws Exception {
    StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();
    // 'sync' is defined outside this snippet; presumably a test blocker such as
    // org.apache.flink.core.testutils.BlockerSync, whose block() call parks the
    // source thread until releaseBlocker() is invoked from cancel().
    env.addSource(new SourceFunction<String>() {
        @Override
        public void run(SourceContext<String> ctx) throws Exception {
            sync.block();
        }

        @Override
        public void cancel() {
            sync.releaseBlocker();
        }
    }).addSink(new PrintSinkFunction());
    env.execute();
}
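// A minimal sketch of the 'sync' blocker used above, assuming semantics similar to
// Flink's BlockerSync test utility. In a real test it would typically live in a
// static field so the serialized source function can still reach it.
static final class SimpleBlockerSync {
    private final Object lock = new Object();
    private boolean released;

    // Parks the calling thread until releaseBlocker() is invoked.
    void block() throws InterruptedException {
        synchronized (lock) {
            while (!released) {
                lock.wait();
            }
        }
    }

    // Wakes up any thread currently parked in block().
    void releaseBlocker() {
        synchronized (lock) {
            released = true;
            lock.notifyAll();
        }
    }
}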
/**
 * Tests whether the Elasticsearch sink fails when there is no cluster to connect to.
 */
public void runInvalidElasticsearchClusterTest() throws Exception {
    final StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();

    DataStreamSource<Tuple2<Integer, String>> source =
        env.addSource(new SourceSinkDataTestKit.TestDataSourceFunction());

    // note: userConfig is built here but not passed on to the sink in this snippet
    Map<String, String> userConfig = new HashMap<>();
    userConfig.put(ElasticsearchSinkBase.CONFIG_KEY_BULK_FLUSH_MAX_ACTIONS, "1");
    userConfig.put("cluster.name", "invalid-cluster-name");

    source.addSink(createElasticsearchSinkForNode(
        1,
        "invalid-cluster-name",
        new SourceSinkDataTestKit.TestElasticsearchSinkFunction("test"),
        "123.123.123.123")); // unreachable IP address

    try {
        env.execute("Elasticsearch Sink Test");
    } catch (JobExecutionException expectedException) {
        // test passes
        return;
    }

    fail();
}
FlinkKafkaConsumerBase<String> source = kafkaServer.getConsumer(topic, new SimpleStringSchema(), props);
env.addSource(source).addSink(new DiscardingSink<String>());
DataStreamSource<Tuple2<Long, byte[]>> consuming = env.addSource(source);
consuming.addSink(new SinkFunction<Tuple2<Long, byte[]>>() {
    // The sink body is truncated in the original snippet; a no-op invoke() and the
    // closing braces are supplied here only so the fragment compiles.
    @Override
    public void invoke(Tuple2<Long, byte[]> value) {
    }
});
public static void main(String[] args) throws Exception {
    final ParameterTool pt = ParameterTool.fromArgs(args);
    final StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();
    setupEnvironment(env, pt);

    final int numStates =
        pt.getInt(NUM_LIST_STATES_PER_OP.key(), NUM_LIST_STATES_PER_OP.defaultValue());
    final int numPartitionsPerState =
        pt.getInt(NUM_PARTITIONS_PER_LIST_STATE.key(), NUM_PARTITIONS_PER_LIST_STATE.defaultValue());

    Preconditions.checkState(env.getCheckpointInterval() > 0L,
        "Checkpointing must be enabled for this test!");

    env.addSource(new SimpleEndlessSourceWithBloatedState(numStates, numPartitionsPerState))
        .setParallelism(env.getParallelism())
        .addSink(new DiscardingSink<>())
        .setParallelism(1);

    env.execute("HeavyDeploymentStressTestProgram");
}
consuming.addSink(new RichSinkFunction<Tuple2<Long, String>>() {
    // The sink body is truncated in the original snippet; a no-op invoke() and the
    // closing braces are supplied here only so the fragment compiles.
    @Override
    public void invoke(Tuple2<Long, String> value) {
    }
});
public void doTestPropagationFromCheckpointConfig(boolean failTaskOnCheckpointErrors) throws Exception {
    StreamExecutionEnvironment streamExecutionEnvironment = StreamExecutionEnvironment.getExecutionEnvironment();
    streamExecutionEnvironment.setParallelism(1);
    streamExecutionEnvironment.getCheckpointConfig().setCheckpointInterval(1000);
    streamExecutionEnvironment.getCheckpointConfig().setFailOnCheckpointingErrors(failTaskOnCheckpointErrors);

    streamExecutionEnvironment.addSource(new SourceFunction<Integer>() {
        @Override
        public void run(SourceContext<Integer> ctx) throws Exception {
        }

        @Override
        public void cancel() {
        }
    }).addSink(new DiscardingSink<>());

    StreamGraph streamGraph = streamExecutionEnvironment.getStreamGraph();
    JobGraph jobGraph = StreamingJobGraphGenerator.createJobGraph(streamGraph);

    SerializedValue<ExecutionConfig> serializedExecutionConfig = jobGraph.getSerializedExecutionConfig();
    ExecutionConfig executionConfig =
        serializedExecutionConfig.deserializeValue(Thread.currentThread().getContextClassLoader());

    Assert.assertEquals(failTaskOnCheckpointErrors, executionConfig.isFailTaskOnCheckpointError());
}
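// Hypothetical callers of the parameterized helper above, exercising both settings:
@Test
public void testPropagationFailureEnabled() throws Exception {
    doTestPropagationFromCheckpointConfig(true);
}

@Test
public void testPropagationFailureDisabled() throws Exception {
    doTestPropagationFromCheckpointConfig(false);
}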
/**
 * Tests that the Elasticsearch sink works properly.
 */
public void runElasticsearchSinkTest() throws Exception {
    final String index = "elasticsearch-sink-test-index";

    final StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();

    DataStreamSource<Tuple2<Integer, String>> source =
        env.addSource(new SourceSinkDataTestKit.TestDataSourceFunction());

    source.addSink(createElasticsearchSinkForEmbeddedNode(
        1, CLUSTER_NAME, new SourceSinkDataTestKit.TestElasticsearchSinkFunction(index)));

    env.execute("Elasticsearch Sink Test");

    // verify the results
    Client client = embeddedNodeEnv.getClient();
    SourceSinkDataTestKit.verifyProducedSinkData(client, index);

    client.close();
}
@Test @SuppressWarnings("unchecked") public void testFromCollectionParallelism() { try { TypeInformation<Integer> typeInfo = BasicTypeInfo.INT_TYPE_INFO; StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment(); DataStreamSource<Integer> dataStream1 = env.fromCollection(new DummySplittableIterator<Integer>(), typeInfo); try { dataStream1.setParallelism(4); fail("should throw an exception"); } catch (IllegalArgumentException e) { // expected } dataStream1.addSink(new DiscardingSink<Integer>()); DataStreamSource<Integer> dataStream2 = env.fromParallelCollection(new DummySplittableIterator<Integer>(), typeInfo).setParallelism(4); dataStream2.addSink(new DiscardingSink<Integer>()); env.getExecutionPlan(); assertEquals("Parallelism of collection source must be 1.", 1, env.getStreamGraph().getStreamNode(dataStream1.getId()).getParallelism()); assertEquals("Parallelism of parallel collection source must be 4.", 4, env.getStreamGraph().getStreamNode(dataStream2.getId()).getParallelism()); } catch (Exception e) { e.printStackTrace(); fail(e.getMessage()); } }
@Test
public void testSources() {
    StreamExecutionEnvironment env = StreamExecutionEnvironment.getExecutionEnvironment();

    SourceFunction<Integer> srcFun = new SourceFunction<Integer>() {
        private static final long serialVersionUID = 1L;

        @Override
        public void run(SourceContext<Integer> ctx) throws Exception {
        }

        @Override
        public void cancel() {
        }
    };
    DataStreamSource<Integer> src1 = env.addSource(srcFun);
    src1.addSink(new DiscardingSink<Integer>());
    assertEquals(srcFun, getFunctionFromDataSource(src1));

    List<Long> list = Arrays.asList(0L, 1L, 2L);

    DataStreamSource<Long> src2 = env.generateSequence(0, 2);
    assertTrue(getFunctionFromDataSource(src2) instanceof StatefulSequenceSource);

    DataStreamSource<Long> src3 = env.fromElements(0L, 1L, 2L);
    assertTrue(getFunctionFromDataSource(src3) instanceof FromElementsFunction);

    DataStreamSource<Long> src4 = env.fromCollection(list);
    assertTrue(getFunctionFromDataSource(src4) instanceof FromElementsFunction);
}
// 'parallelSource' is created outside this snippet and configured with parallelism 7.
parallelSource.addSink(new DiscardingSink<Long>());
assertEquals(7, env.getStreamGraph().getStreamNode(parallelSource.getId()).getParallelism());
public static void main(String[] args) throws Exception {
    final ParameterTool parameterTool = ExecutionEnvUtil.createParameterTool(args);
    StreamExecutionEnvironment env = ExecutionEnvUtil.prepare(parameterTool);
    DataStreamSource<Metrics> data = KafkaConfigUtil.buildSource(env);

    data.addSink(new FlinkKafkaProducer011<Metrics>(
            parameterTool.get("kafka.sink.brokers"),
            parameterTool.get("kafka.sink.topic"),
            new MetricSchema()
        )).name("flink-connectors-kafka")
        .setParallelism(parameterTool.getInt("stream.sink.parallelism"));

    env.execute("flink learning connectors kafka");
}
@Test
public void testSink() throws Exception {
    StreamExecutionEnvironment environment = StreamExecutionEnvironment.getExecutionEnvironment();

    environment.fromElements("string1", "string2")
        .addSink(new FlumeSink<>("172.25.0.3", 44444, new SimpleStringSchema()));

    tryExecute(environment, "FlumeTest");
}