/**
 * Builds a one-line textual rendering of the nodes this object iterates over.
 *
 * <p>Nodes are visited in iteration order and rendered in one of three shapes:
 * <ul>
 *   <li>a node for which {@code isCommonNode} returns true: delimited form
 *       followed by delimited POS tag, with no arc;</li>
 *   <li>a node visited before any common node has been seen: delimited form,
 *       delimited POS tag, then the delimited dependency relation wrapped in
 *       {@code UP_ARC_B} ... {@code UP_ARC_A};</li>
 *   <li>a node visited after a common node has been seen: the delimited
 *       dependency relation wrapped in {@code DN_ARC_A} ... {@code DN_ARC_B},
 *       then delimited form and delimited POS tag.</li>
 * </ul>
 *
 * @return the concatenation of all rendered nodes; empty if there are no nodes
 */
public String toString() {
    StringBuilder rendered = new StringBuilder();
    // Flips to true at the first common node and never resets.
    boolean pastCommon = false;

    for (ConllDependencyNode current : this) {
        if (isCommonNode(current)) {
            pastCommon = true;
            rendered.append( L_TOK_DELIM + current.getForm() + R_TOK_DELIM );
            rendered.append( L_POS_DELIM + current.getPostag() + R_POS_DELIM );
        } else if (pastCommon) {
            // Past the common node: arc first, then the token.
            rendered.append(
                    DN_ARC_A + L_REL_DELIM + current.getDeprel() + R_REL_DELIM + DN_ARC_B
                    + L_TOK_DELIM + current.getForm() + R_TOK_DELIM
                    + L_POS_DELIM + current.getPostag() + R_POS_DELIM );
        } else {
            // Before the common node: token first, then the arc.
            rendered.append(
                    L_TOK_DELIM + current.getForm() + R_TOK_DELIM
                    + L_POS_DELIM + current.getPostag() + R_POS_DELIM
                    + UP_ARC_B + L_REL_DELIM + current.getDeprel() + R_REL_DELIM + UP_ARC_A );
        }
    }

    return rendered.toString();
}
/**
 * Returns a string form of this node sequence, one segment per node in
 * iteration order.
 *
 * <p>Every segment contains the node's form and POS tag, each wrapped in its
 * delimiters. Nodes for which {@code isCommonNode} is false also carry their
 * dependency relation: placed after the token (between {@code UP_ARC_B} and
 * {@code UP_ARC_A}) while no common node has been encountered yet, and placed
 * before the token (between {@code DN_ARC_A} and {@code DN_ARC_B}) once one has.
 *
 * @return all segments joined without any extra separator
 */
public String toString() {
    StringBuilder out = new StringBuilder();
    boolean seenCommon = false;

    for (ConllDependencyNode dep : this) {
        final String segment;
        if (isCommonNode(dep)) {
            // The common node itself is rendered without a relation.
            seenCommon = true;
            segment = L_TOK_DELIM + dep.getForm() + R_TOK_DELIM
                    + L_POS_DELIM + dep.getPostag() + R_POS_DELIM;
        } else if (!seenCommon) {
            segment = L_TOK_DELIM + dep.getForm() + R_TOK_DELIM
                    + L_POS_DELIM + dep.getPostag() + R_POS_DELIM
                    + UP_ARC_B + L_REL_DELIM + dep.getDeprel() + R_REL_DELIM + UP_ARC_A;
        } else {
            segment = DN_ARC_A + L_REL_DELIM + dep.getDeprel() + R_REL_DELIM + DN_ARC_B
                    + L_TOK_DELIM + dep.getForm() + R_TOK_DELIM
                    + L_POS_DELIM + dep.getPostag() + R_POS_DELIM;
        }
        out.append(segment);
    }

    return out.toString();
}
if (regnodes[i].getForm()==null) regnodes[i].setForm(ANY_TOKEN); if (regnodes[i].getPostag()==null) regnodes[i].setPostag(ANY_POS); if (regnodes[i].getDeprel()==null) regnodes[i].setDeprel(ANY_DEPREL); if (i==commonNodeIndex-1) { str.append( L_TOK_DELIM + regnodes[i].getForm() + R_TOK_DELIM ); str.append( L_POS_DELIM + regnodes[i].getPostag() + R_POS_DELIM ); continue; + L_REL_DELIM + regnodes[i].getDeprel() + R_REL_DELIM + DN_ARC_B + L_TOK_DELIM + regnodes[i].getForm() + R_TOK_DELIM + L_POS_DELIM + regnodes[i].getPostag() + R_POS_DELIM L_TOK_DELIM + regnodes[i].getForm() + R_TOK_DELIM + L_POS_DELIM + regnodes[i].getPostag() + R_POS_DELIM + UP_ARC_B
if (regnodes[i].getForm()==null) regnodes[i].setForm(ANY_TOKEN); if (regnodes[i].getPostag()==null) regnodes[i].setPostag(ANY_POS); if (regnodes[i].getDeprel()==null) regnodes[i].setDeprel(ANY_DEPREL); if (i==commonNodeIndex-1) { str.append( L_TOK_DELIM + regnodes[i].getForm() + R_TOK_DELIM ); str.append( L_POS_DELIM + regnodes[i].getPostag() + R_POS_DELIM ); continue; + L_REL_DELIM + regnodes[i].getDeprel() + R_REL_DELIM + DN_ARC_B + L_TOK_DELIM + regnodes[i].getForm() + R_TOK_DELIM + L_POS_DELIM + regnodes[i].getPostag() + R_POS_DELIM L_TOK_DELIM + regnodes[i].getForm() + R_TOK_DELIM + L_POS_DELIM + regnodes[i].getPostag() + R_POS_DELIM + UP_ARC_B
L_TOK_DELIM + node.getHead().getForm() + R_TOK_DELIM + L_POS_DELIM + node.getHead().getPostag() + R_POS_DELIM + DN_ARC_A + L_REL_DELIM + node.getDeprel() + R_REL_DELIM + DN_ARC_B + L_TOK_DELIM + node.getForm() + R_TOK_DELIM + L_POS_DELIM + node.getPostag() + R_POS_DELIM L_TOK_DELIM + node.getForm() + R_TOK_DELIM + L_POS_DELIM + node.getPostag() + R_POS_DELIM + UP_ARC_B + L_REL_DELIM + node.getDeprel() + R_REL_DELIM + UP_ARC_A + L_TOK_DELIM + node.getHead().getForm() + R_TOK_DELIM + L_POS_DELIM + node.getHead().getPostag() + R_POS_DELIM
L_TOK_DELIM + node.getHead().getForm() + R_TOK_DELIM + L_POS_DELIM + node.getHead().getPostag() + R_POS_DELIM + DN_ARC_A + L_REL_DELIM + node.getDeprel() + R_REL_DELIM + DN_ARC_B + L_TOK_DELIM + node.getForm() + R_TOK_DELIM + L_POS_DELIM + node.getPostag() + R_POS_DELIM L_TOK_DELIM + node.getForm() + R_TOK_DELIM + L_POS_DELIM + node.getPostag() + R_POS_DELIM + UP_ARC_B + L_REL_DELIM + node.getDeprel() + R_REL_DELIM + UP_ARC_A + L_TOK_DELIM + node.getHead().getForm() + R_TOK_DELIM + L_POS_DELIM + node.getHead().getPostag() + R_POS_DELIM
bw.write( node.getForm() + "\t" ); bw.write( (node.getHead() == null ? "_" : node.getHead().getId()) + "\t" ); bw.write( node.getDeprel() + "\n" ); } else if ( iv_outputFormat.toLowerCase().contains( "mpos" ) ) { bw.write( node.getId() + "\t" ); bw.write( node.getForm() + "\t" ); bw.write( node.getPostag() + "\t" ); bw.write( (node.getHead() == null ? "_" : node.getHead().getId()) + "\t" ); } else if ( iv_outputFormat.toLowerCase().contains( "mlem" ) ) { bw.write( node.getId() + "\t" ); bw.write( node.getForm() + "\t" ); bw.write( node.getLemma() + "\t" ); bw.write( (node.getHead() == null ? "_" : node.getHead().getId()) + "\t" ); } else if ( iv_outputFormat.toLowerCase().contains( "dep" ) ) { bw.write( node.getId() + "\t" ); bw.write( node.getForm() + "\t" ); bw.write( node.getLemma() + "\t" ); bw.write( node.getPostag() + "\t" ); } else { //if (iv_outputFormat.toLowerCase().contains("conll")) { bw.write( node.getId() + "\t" ); bw.write( node.getForm() + "\t" ); bw.write( node.getLemma() + "\t" ); bw.write( node.getCpostag() + "\t" );
bw.write( node.getForm() + "\t" ); bw.write( (node.getHead() == null ? "_" : node.getHead().getId()) + "\t" ); bw.write( node.getDeprel() + "\n" ); } else if ( iv_outputFormat.toLowerCase().contains( "mpos" ) ) { bw.write( node.getId() + "\t" ); bw.write( node.getForm() + "\t" ); bw.write( node.getPostag() + "\t" ); bw.write( (node.getHead() == null ? "_" : node.getHead().getId()) + "\t" ); } else if ( iv_outputFormat.toLowerCase().contains( "mlem" ) ) { bw.write( node.getId() + "\t" ); bw.write( node.getForm() + "\t" ); bw.write( node.getLemma() + "\t" ); bw.write( (node.getHead() == null ? "_" : node.getHead().getId()) + "\t" ); } else if ( iv_outputFormat.toLowerCase().contains( "dep" ) ) { bw.write( node.getId() + "\t" ); bw.write( node.getForm() + "\t" ); bw.write( node.getLemma() + "\t" ); bw.write( node.getPostag() + "\t" ); } else { //if (iv_outputFormat.toLowerCase().contains("conll")) { bw.write( node.getId() + "\t" ); bw.write( node.getForm() + "\t" ); bw.write( node.getLemma() + "\t" ); bw.write( node.getCpostag() + "\t" );
String nodeText = node.getCoveredText(); if(node.getForm().matches("\\s+")) return null;
String form = casDepNode.getForm(); String pos = casDepNode.getPostag(); String lemma = casDepNode.getLemma();
String form = casDepNode.getForm(); String pos = casDepNode.getPostag(); String lemma = casDepNode.getLemma();
if(node.getForm().matches("\\s+")) continue;