org.apache.flink.streaming.api.datastream.DataStream.print java code examples

/**
 * A thin wrapper layer over {@link DataStream#print()}.
 *
 * <p>Delegates to {@code stream.print()} and discards whatever that call returns.
 */
@PublicEvolving
public void output() {
  stream.print();
}

/**
 * Calls {@code print()} on the given stream and returns the id of the transformation
 * behind the result of that call.
 *
 * @param dataStream the stream on which {@code print()} is invoked
 * @return the value of {@code getTransformation().getId()} for the print result
 */
private static Integer createDownStreamId(DataStream<?> dataStream) {
  final Integer printTransformationId = dataStream.print().getTransformation().getId();
  return printTransformationId;
}

/**
 * Entry point of the windowed join example.
 *
 * <p>Reads the optional {@code --windowSize} (default 2000) and {@code --rate} (default 3)
 * arguments, joins the grade and salary sources through {@code runWindowJoin}, prints the
 * joined stream with parallelism 1 and executes the job.
 *
 * @param args command-line arguments, parsed with {@code ParameterTool.fromArgs}
 * @throws Exception propagated from setting up or executing the job
 */
public static void main(String[] args) throws Exception {
  // read the command-line options, falling back to the defaults
  final ParameterTool params = ParameterTool.fromArgs(args);
  final long windowSize = params.getLong("windowSize", 2000L);
  final long rate = params.getLong("rate", 3L);

  System.out.println("Using windowSize=" + windowSize + ", data rate=" + rate);
  System.out.println("To customize example, use: WindowJoin [--windowSize <window-size-in-millis>] [--rate <elements-per-second>]");

  // the example runs on ingestion time
  final StreamExecutionEnvironment environment = StreamExecutionEnvironment.getExecutionEnvironment();
  environment.setStreamTimeCharacteristic(TimeCharacteristic.IngestionTime);

  // register the parameters as global job parameters
  environment.getConfig().setGlobalJobParameters(params);

  // one source per side of the join
  final DataStream<Tuple2<String, Integer>> gradeStream = GradeSource.getSource(environment, rate);
  final DataStream<Tuple2<String, Integer>> salaryStream = SalarySource.getSource(environment, rate);

  // the join itself lives in runWindowJoin; its result is printed by a single
  // sink instance (parallelism 1) instead of in parallel
  runWindowJoin(gradeStream, salaryStream, windowSize)
      .print()
      .setParallelism(1);

  // submit the job
  environment.execute("Windowed Join Example");
}

} else {
  System.out.println("Printing result to stdout. Use --output to specify output path.");
  aggregated.print();

/**
 * Entry point of the stream SQL example.
 *
 * <p>Builds two in-memory {@code Order} streams, exposes the first as a {@code Table} and
 * registers the second under the name {@code OrderB}, runs a {@code UNION ALL} query over
 * both, converts the result to an append stream of {@code Order} and prints it.
 *
 * @param args command-line arguments (not read by this method)
 * @throws Exception propagated from setting up or executing the job
 */
public static void main(String[] args) throws Exception {
  // streaming environment plus the table environment layered on top of it
  final StreamExecutionEnvironment streamEnv = StreamExecutionEnvironment.getExecutionEnvironment();
  final StreamTableEnvironment tableEnv = TableEnvironment.getTableEnvironment(streamEnv);

  final DataStream<Order> firstOrders = streamEnv.fromCollection(
    Arrays.asList(
      new Order(1L, "beer", 3),
      new Order(1L, "diaper", 4),
      new Order(3L, "rubber", 2)));

  final DataStream<Order> secondOrders = streamEnv.fromCollection(
    Arrays.asList(
      new Order(2L, "pen", 3),
      new Order(2L, "rubber", 3),
      new Order(4L, "beer", 1)));

  // first stream: converted directly into a Table object
  final Table firstOrdersTable = tableEnv.fromDataStream(firstOrders, "user, product, amount");

  // second stream: registered under a name that the query refers to
  tableEnv.registerDataStream("OrderB", secondOrders, "user, product, amount");

  // the Table object is concatenated into the query text in place of a table name
  final String unionQuery =
    "SELECT * FROM " + firstOrdersTable + " WHERE amount > 2 UNION ALL SELECT * FROM OrderB WHERE amount < 2";
  final Table unionResult = tableEnv.sqlQuery(unionQuery);

  tableEnv.toAppendStream(unionResult, Order.class).print();

  streamEnv.execute();
}

} else {
  System.out.println("Printing result to stdout. Use --output to specify output path.");
  counts.print();

} else {
  System.out.println("Printing result to stdout. Use --output to specify output path.");
  counts.print();

/**
 * Expects an {@link UnsupportedOperationException} while building an iteration directly
 * on a {@code fromElements} source and closing it with a mapped feedback stream.
 *
 * <p>NOTE(review): the test name suggests the failure comes from a parallelism mismatch
 * between the source and the iteration - confirm against the iteration implementation.
 */
@Test(expected = UnsupportedOperationException.class)
public void testIncorrectParallelism() throws Exception {
  final StreamExecutionEnvironment environment = StreamExecutionEnvironment.getExecutionEnvironment();

  final DataStream<Integer> numbers = environment.fromElements(1, 10);
  final IterativeStream<Integer> iteration = numbers.iterate();

  // feed the mapped iteration output back into the iteration head and print the result
  final SingleOutputStreamOperator<Integer> feedback = iteration.map(noOpIntMap);
  iteration
      .closeWith(feedback)
      .print();
}

} else {
  System.out.println("Printing result to stdout. Use --output to specify output path.");
  tweets.print();

  FlinkKafkaConsumerBase<String> source = kafkaServer.getConsumer("doesntexist", new SimpleStringSchema(), properties);
  DataStream<String> stream = see.addSource(source);
  stream.print();
  see.execute("No broker test");
} catch (JobExecutionException jee) {

} else {
  System.out.println("Printing result to stdout. Use --output to specify output path.");
  counts.print();
  rejectedWords.print();

/**
 * Verifies that {@code withFeedbackType} yields a separate iteration: after closing both
 * the original and the co-iteration, the stream graph must contain two iteration
 * source/sink pairs, and for each pair the target of the source's first out-edge must be
 * the source of the sink's first in-edge.
 */
@Test
public void testImmutabilityWithCoiteration() {
  final StreamExecutionEnvironment environment = StreamExecutionEnvironment.getExecutionEnvironment();

  // the extra map is there for rebalance
  final DataStream<Integer> input = environment.fromElements(1, 10).map(noOpIntMap);

  final IterativeStream<Integer> plainIteration = input.iterate();
  // withFeedbackType is expected to create a new iteration rather than alter the first
  final ConnectedIterativeStreams<Integer, String> coIteration =
      plainIteration.withFeedbackType(String.class);

  plainIteration.closeWith(plainIteration.map(noOpIntMap)).print();
  coIteration.closeWith(coIteration.map(noOpCoMap)).print();

  final StreamGraph streamGraph = environment.getStreamGraph();
  assertEquals(2, streamGraph.getIterationSourceSinkPairs().size());

  for (Tuple2<StreamNode, StreamNode> pair : streamGraph.getIterationSourceSinkPairs()) {
    final StreamNode iterationSource = pair.f0;
    final StreamNode iterationSink = pair.f1;
    assertEquals(
      streamGraph.getTargetVertex(iterationSource.getOutEdges().get(0)),
      streamGraph.getSourceVertex(iterationSink.getInEdges().get(0)));
  }
}

/**
 * Entry point of the incremental learning example.
 *
 * <p>Builds a model from 5000 ms windows over the training data, connects the new data
 * with that model stream to produce predictions, and either writes the predictions to
 * the path given by {@code --output} or prints them to stdout.
 *
 * @param args command-line arguments; only {@code --output} is read here
 * @throws Exception propagated from setting up or executing the job
 */
public static void main(String[] args) throws Exception {
  // parse the command-line arguments
  final ParameterTool params = ParameterTool.fromArgs(args);

  final StreamExecutionEnvironment environment = StreamExecutionEnvironment.getExecutionEnvironment();
  environment.setStreamTimeCharacteristic(TimeCharacteristic.EventTime);

  final DataStream<Integer> trainingStream = environment.addSource(new FiniteTrainingDataSource());
  final DataStream<Integer> incomingStream = environment.addSource(new FiniteNewDataSource());

  // one model per 5000 ms window over all of the training data
  final DataStream<Double[]> modelStream = trainingStream
      .assignTimestampsAndWatermarks(new LinearTimestamp())
      .timeWindowAll(Time.of(5000, TimeUnit.MILLISECONDS))
      .apply(new PartialModelBuilder());

  // combine the incoming data with the model stream to obtain predictions
  final DataStream<Integer> predictions = incomingStream.connect(modelStream).map(new Predictor());

  // emit the predictions: stdout unless an output path was supplied
  if (!params.has("output")) {
    System.out.println("Printing result to stdout. Use --output to specify output path.");
    predictions.print();
  } else {
    predictions.writeAsText(params.get("output"));
  }

  // submit the job
  environment.execute("Streaming Incremental Learning");
}

windowCounts.print().setParallelism(1);

} else {
  System.out.println("Printing result to stdout. Use --output to specify output path.");
  numbers.print();

DataStreamSink<Long> broadcastSink = broadcast.print();
StreamPartitioner<?> broadcastPartitioner =
    env.getStreamGraph().getStreamEdges(src.getId(),
DataStreamSink<Long> shuffleSink = shuffle.print();
StreamPartitioner<?> shufflePartitioner =
    env.getStreamGraph().getStreamEdges(src.getId(),
DataStreamSink<Long> forwardSink = forward.print();
StreamPartitioner<?> forwardPartitioner =
    env.getStreamGraph().getStreamEdges(src.getId(),
DataStreamSink<Long> rebalanceSink = rebalance.print();
StreamPartitioner<?> rebalancePartitioner =
    env.getStreamGraph().getStreamEdges(src.getId(),
DataStreamSink<Long> globalSink = global.print();
StreamPartitioner<?> globalPartitioner =
    env.getStreamGraph().getStreamEdges(src.getId(),

} else {
  System.out.println("Printing result to stdout. Use --output to specify output path.");
  topSpeeds.print();

/**
 * Sums the nested field {@code stats.count} per {@code aaa} key and checks the running
 * sums inside a flat-map: the first record seen for a key must carry a count of 123, and
 * every later record for that key a count of 2 * 123.
 *
 * <p>The flat-map never emits to its collector, so nothing reaches the print sink; a
 * failed check surfaces as a {@link RuntimeException} thrown from within the function.
 */
@Test
public void testNestedPojoFieldAccessor() throws Exception {
  final StreamExecutionEnvironment environment = StreamExecutionEnvironment.getExecutionEnvironment();
  environment.getConfig().disableObjectReuse();
  environment.setParallelism(4);

  final DataStream<Data> input = environment.fromCollection(elements);

  final DataStream<Data> checkedSums = input
    .keyBy("aaa")
    .sum("stats.count")
    .keyBy("aaa")
    .flatMap(new FlatMapFunction<Data, Data>() {
      // first record observed for each key, indexed by the record's aaa value
      Data[] firstSeen = new Data[3];

      @Override
      public void flatMap(Data record, Collector<Data> collector) throws Exception {
        final boolean isFirstForKey = firstSeen[record.aaa] == null;
        if (isFirstForKey) {
          // remember the record before validating it, as the slot marks the key as seen
          firstSeen[record.aaa] = record;
          if (record.stats.count != 123) {
            throw new RuntimeException("Expected stats.count to be 123");
          }
        } else if (record.stats.count != 2 * 123) {
          throw new RuntimeException("Expected stats.count to be 2 * 123");
        }
      }
    });

  checkedSums.print();
  environment.execute();
}

summedStream.print();

summedStream.print();

Javadoc

Writes a DataStream to the standard output stream (stdout).

For each element of the DataStream the result of Object#toString() is written.

NOTE: This will print to stdout on the machine where the code is executed, i.e. the Flink worker.

Popular methods of DataStream

addSink
Adds the given sink to this DataStream. Only streams with sinks added will be executed once the Stre
keyBy
Partitions the operator state of a DataStream using field expressions. A field expression is either
map
Applies a Map transformation on a DataStream. The transformation calls a MapFunction for each elemen
flatMap
Applies a FlatMap transformation on a DataStream. The transformation calls a FlatMapFunction for eac
getType
Gets the type of the stream.
union
Creates a new DataStream by merging DataStream outputs of the same type with each other. The DataStr
transform
Method for passing user defined operators along with the type information that will transform the Da
getExecutionEnvironment
Returns the StreamExecutionEnvironment that was used to create this DataStream.
getTransformation
Returns the StreamTransformation that represents the operation that logically creates this DataStrea
rebalance
Sets the partitioning of the DataStream so that the output elements are distributed evenly to instan
writeAsText
Writes a DataStream to the file specified by path in text format. For every element of the DataStream
broadcast
Sets the partitioning of the DataStream so that the output elements are broadcasted to every paralle

Popular in Java

Running tasks concurrently on multiple threads
startActivity (Activity)
getSystemService (Context)
addToBackStack (FragmentTransaction)
Options (org.apache.commons.cli)
Main entry-point into the library. Options represents a collection of Option objects, which describ
Logger (org.apache.log4j)
This is the central class in the log4j package. Most logging operations, except configuration, are d
Logger (org.slf4j)
The org.slf4j.Logger interface is the main user entry point of SLF4J API. It is expected that loggin
Notification (javax.management)
Table (org.hibernate.mapping)
A relational table
Scheduler (org.quartz)
This is the main interface of a Quartz Scheduler. A Scheduler maintains a registry of org.quartz.Job
Best IntelliJ plugins

How to use the print method in org.apache.flink.streaming.api.datastream.DataStream

Best Java code snippets using org.apache.flink.streaming.api.datastream.DataStream.print (Showing top 20 results out of 315)

How to use the print method in org.apache.flink.streaming.api.datastream.DataStream