.filter(new FilterFunction<Integer>() {
    @Override
    public boolean filter(Integer value) {
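The fragment above is cut off before the predicate body. A minimal self-contained sketch of the same anonymous FilterFunction pattern, assuming a hypothetical even-number predicate in place of the elided body:

import org.apache.flink.api.common.functions.FilterFunction;
import org.apache.flink.api.java.DataSet;
import org.apache.flink.api.java.ExecutionEnvironment;

public class FilterExample {
    public static void main(String[] args) throws Exception {
        ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment();
        DataSet<Integer> numbers = env.fromElements(1, 2, 3, 4, 5, 6);

        // keep only even values; this predicate is a hypothetical stand-in
        // for the body elided in the original fragment
        DataSet<Integer> evens = numbers.filter(new FilterFunction<Integer>() {
            @Override
            public boolean filter(Integer value) {
                return value % 2 == 0;
            }
        });

        evens.print();
    }
}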
/**
 * Tests a cross program with a replicated data source behind a map and a filter.
 */
@Test
public void checkCrossWithReplicatedSourceInputBehindMap() {
    ExecutionEnvironment env = ExecutionEnvironment.createLocalEnvironment();
    env.setParallelism(DEFAULT_PARALLELISM);

    TupleTypeInfo<Tuple1<String>> typeInfo = TupleTypeInfo.getBasicTupleTypeInfo(String.class);
    ReplicatingInputFormat<Tuple1<String>, FileInputSplit> rif =
        new ReplicatingInputFormat<Tuple1<String>, FileInputSplit>(
            new TupleCsvInputFormat<Tuple1<String>>(new Path("/some/path"), typeInfo));

    DataSet<Tuple1<String>> source1 = env.createInput(
        rif, new TupleTypeInfo<Tuple1<String>>(BasicTypeInfo.STRING_TYPE_INFO));
    DataSet<Tuple1<String>> source2 = env.readCsvFile("/some/otherpath").types(String.class);

    DataSink<Tuple2<Tuple1<String>, Tuple1<String>>> out = source1
        .map(new IdMap())
        .filter(new NoFilter())
        .cross(source2)
        .writeAsText("/some/newpath");

    Plan plan = env.createProgramPlan();

    // submit the plan to the compiler
    OptimizedPlan oPlan = compileNoStats(plan);

    // check the optimized plan:
    // the cross should have a forward ship strategy on both sides
    SinkPlanNode sinkNode = oPlan.getDataSinks().iterator().next();
    DualInputPlanNode crossNode = (DualInputPlanNode) sinkNode.getPredecessor();

    ShipStrategyType crossIn1 = crossNode.getInput1().getShipStrategy();
    ShipStrategyType crossIn2 = crossNode.getInput2().getShipStrategy();

    Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, crossIn1);
    Assert.assertEquals("Invalid ship strategy for an operator.", ShipStrategyType.FORWARD, crossIn2);
}
@Override
public DataSet<GraphHead> getGraphHeads() {
    return transactions
        .map(new TransactionGraphHead<>())
        .filter(new ByDifferentId<>(GradoopConstants.DB_GRAPH_ID));
}
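ByDifferentId is Gradoop-internal and not shown here. A hedged sketch of what such a filter plausibly does, keeping elements whose id differs from a fixed id; the Identified interface is a hypothetical stand-in for the actual Gradoop element interface:

import org.apache.flink.api.common.functions.FilterFunction;
import org.gradoop.common.model.impl.id.GradoopId;

// Hedged sketch: keeps elements whose id differs from the given id.
public class ByDifferentId<T extends Identified> implements FilterFunction<T> {

    private final GradoopId id;

    public ByDifferentId(GradoopId id) {
        this.id = id;
    }

    @Override
    public boolean filter(T element) {
        return !element.getId().equals(id);
    }
}

// hypothetical stand-in for the real Gradoop interface exposing an element's id
interface Identified {
    GradoopId getId();
}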
static DataSet<Tuple2<Long, String>> getHdfsSource(ExecutionEnvironment env, URI inputPath) throws IOException {
    SearchEventsParser parser = new SearchEventsParser();
    return env.readFile(new TextInputFormat(new Path(inputPath)), inputPath.toString())
        .map(parser::parse)
        .filter(q -> q != null && q.query != null && !q.query.isEmpty())
        .map(q -> Tuple2.of(q.timestamp, q.query))
        .returns(new TypeHint<Tuple2<Long, String>>() {});
}
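A hedged usage sketch for the source above, assuming a word-count-style follow-up; the HDFS path is hypothetical:

ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment();
DataSet<Tuple2<Long, String>> events = getHdfsSource(env, URI.create("hdfs:///some/events"));

// count how often each query string occurs, ignoring the timestamp;
// returns(...) is needed because the lambda's tuple type is erased
events
    .map(t -> Tuple2.of(t.f1, 1))
    .returns(new TypeHint<Tuple2<String, Integer>>() {})
    .groupBy(0)
    .sum(1)
    .print();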
.map(new CSVLineToGraphHead(graphHeadFactory))
.withBroadcastSet(metaDataBroadcast, BC_METADATA)
.filter(graphHead -> graphHead.getLabel().equals(label))))
.collect(Collectors.toMap(t -> t.f0, t -> t.f1));

.map(new CSVLineToVertex(vertexFactory))
.withBroadcastSet(metaDataBroadcast, BC_METADATA)
.filter(vertex -> vertex.getLabel().equals(label))))
.collect(Collectors.toMap(t -> t.f0, t -> t.f1));

.map(new CSVLineToEdge(edgeFactory))
.withBroadcastSet(metaDataBroadcast, BC_METADATA)
.filter(edge -> edge.getLabel().equals(label))))
.collect(Collectors.toMap(t -> t.f0, t -> t.f1));
graphs
    .map(new HasEmbeddings(new DepthSearchMatching(), queryString))
    .filter(new SecondFieldTrue<>());
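A hedged sketch of what SecondFieldTrue likely does, assuming HasEmbeddings emits Tuple2 values whose Boolean second field flags a match:

import org.apache.flink.api.common.functions.FilterFunction;
import org.apache.flink.api.java.tuple.Tuple2;

// keeps only tuples whose Boolean second field is true
public class SecondFieldTrue<T> implements FilterFunction<Tuple2<T, Boolean>> {
    @Override
    public boolean filter(Tuple2<T, Boolean> value) {
        return value.f1;
    }
}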
.map(new GrowFrequentPatterns(gSpan, fsmConfig))
.withBroadcastSet(frequentPatterns, DIMSpanConstants.FREQUENT_PATTERNS)
.filter(new NotObsolete());
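withBroadcastSet makes the frequentPatterns data set available inside the map function under the given name. A minimal sketch of the standard Flink pattern for reading a broadcast variable in a RichMapFunction; PatternMapper and the "patterns" name are hypothetical:

import java.util.List;
import org.apache.flink.api.common.functions.RichMapFunction;
import org.apache.flink.configuration.Configuration;

// Hedged sketch of the broadcast-variable pattern used above; names are hypothetical.
public class PatternMapper extends RichMapFunction<String, String> {

    private List<String> patterns;

    @Override
    public void open(Configuration parameters) {
        // the name must match the one passed to withBroadcastSet(...)
        this.patterns = getRuntimeContext().getBroadcastVariable("patterns");
    }

    @Override
    public String map(String value) {
        return patterns.contains(value) ? value : "";
    }
}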
public static void main(String[] args) throws Exception {

    // parse parameters
    ParameterTool params = ParameterTool.fromArgs(args);
    String input = params.getRequired("input");

    // obtain an execution environment
    ExecutionEnvironment env = ExecutionEnvironment.getExecutionEnvironment();

    // read messageId, sender, and reply-to fields from the input data set
    DataSet<Tuple3<String, String, String>> mails = env.readCsvFile(input)
        .lineDelimiter(MBoxParser.MAIL_RECORD_DELIM)
        .fieldDelimiter(MBoxParser.MAIL_FIELD_DELIM)
        // messageId at position 0, sender at 2, reply-to at 5
        .includeFields("101001")
        .types(String.class, String.class, String.class);

    // extract email addresses and filter out mails from bots
    DataSet<Tuple3<String, String, String>> addressMails = mails
        .map(new EmailExtractor())
        .filter(new ExcludeEmailFilter("git@git.apache.org"))
        .filter(new ExcludeEmailFilter("jira@apache.org"));

    // construct reply connections by joining on messageId and reply-to
    DataSet<Tuple2<String, String>> replyConnections = addressMails
        .join(addressMails).where(2).equalTo(0).projectFirst(1).projectSecond(1);

    // count reply connections for each pair of email addresses
    replyConnections
        .groupBy(0, 1)
        .reduceGroup(new ConnectionCounter())
        .print();
}
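ConnectionCounter is not shown above. A plausible sketch under the assumption that it emits one count per (sender, replier) group produced by groupBy(0, 1):

import org.apache.flink.api.common.functions.GroupReduceFunction;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.flink.api.java.tuple.Tuple3;
import org.apache.flink.util.Collector;

// Hedged sketch: counts the reply connections in each (sender, replier) group.
public class ConnectionCounter
        implements GroupReduceFunction<Tuple2<String, String>, Tuple3<String, String, Integer>> {

    @Override
    public void reduce(Iterable<Tuple2<String, String>> connections,
                       Collector<Tuple3<String, String, Integer>> out) {
        String from = null;
        String to = null;
        int count = 0;
        // all tuples in a group share the same (from, to) pair, so only the count varies
        for (Tuple2<String, String> connection : connections) {
            from = connection.f0;
            to = connection.f1;
            count++;
        }
        out.collect(Tuple3.of(from, to, count));
    }
}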