/**
 * Parses raw text.
 * <p>
 * The text is first turned into parser output lines by {@code getParserOutput},
 * and those lines are then passed, together with the original text, to
 * {@code parseParserOutput}.
 *
 * @param rawText the text to be parsed
 * @throws ParserRunException propagated from either of the two helper calls
 */
public void parse(String rawText) throws ParserRunException
{
    final List<String> outputLines = getParserOutput(rawText);
    parseParserOutput(outputLines, rawText);
}
/**
 * Creates a rule matcher that owns a newly constructed and initialized
 * {@link EasyFirstParser}.
 * <p>
 * Note that the POS-tagger model path handed to the parser is hard-coded.
 *
 * @param dotDir value stored in the {@code dotDir} field
 * @throws ParserRunException if constructing or initializing the parser fails
 */
public RuleMatcher(String dotDir) throws ParserRunException
{
    this.dotDir = dotDir;

    parser = new EasyFirstParser("b:/jars/stanford-postagger-2008-09-28/bidirectional-wsj-0-18.tagger");
    parser.init();
}
/**
 * Sets the POS-tagged sentence to work on.
 *
 * @param posTaggedSentence the tagged tokens, stored in the field of the same name
 */
@Override
public void setSentence(List<PosTaggedToken> posTaggedSentence)
{
    // reset() is always called before the new sentence is stored.
    reset();

    this.posTaggedSentence = posTaggedSentence;
}
/**
 * Demo run: parses the sentence "I love you." with an {@link EasyFirstParser}
 * and prints a textual rendering of the parse tree to standard output.
 * <p>
 * The first element of {@code args} is passed to the parser constructor as the
 * POS-tagger file. {@code cleanUp()} is called on the parser once it has been
 * initialized, whether or not parsing succeeds.
 *
 * @throws ParserRunException if the parser fails
 * @throws TreeStringGeneratorException if the tree cannot be rendered as a string
 */
public void f() throws ParserRunException, TreeStringGeneratorException
{
    final EasyFirstParser parser = new EasyFirstParser(args[0]);
    parser.init();
    try
    {
        parser.setSentence("I love you.");
        parser.parse();

        final BasicNode parseTree = parser.getParseTree();
        final String rendered =
            new TreeStringGenerator<Info>(new IdLemmaPosRelNodeString(), parseTree).generateString();
        System.out.println(rendered);
    }
    finally
    {
        parser.cleanUp();
    }
}
/**
 * Creates (but does not initialize) an {@link EasyFirstParser}.
 * <ul>
 * <li>If both {@code host} and {@code port} are {@code null}, the parser is built
 * from the POS-tagger file name alone.</li>
 * <li>Otherwise a missing host defaults to {@code "localhost"} and a missing port
 * to {@code EasyFirstParser.DEFAULT_PORT}.</li>
 * </ul>
 *
 * @param host parser host, may be {@code null}
 * @param port parser port, may be {@code null}
 * @param stanfordPosTaggerModuleFileName POS-tagger file name, must not be {@code null}
 * @return the newly constructed parser
 * @throws ParserRunException declared for the parser constructors
 * @throws TeEngineMlException if {@code stanfordPosTaggerModuleFileName} is {@code null}
 */
private static EnglishSingleTreeParser getParserEasyFirst(String host, Integer port, String stanfordPosTaggerModuleFileName) throws ParserRunException, TeEngineMlException
{
    if (stanfordPosTaggerModuleFileName == null)
    {
        throw new TeEngineMlException("Null stanfordPosTaggerModuleFileName");
    }

    if (host == null && port == null)
    {
        return new EasyFirstParser(stanfordPosTaggerModuleFileName);
    }

    String effectiveHost = host;
    if (effectiveHost == null)
    {
        effectiveHost = "localhost";
    }

    Integer effectivePort = port;
    if (effectivePort == null)
    {
        effectivePort = EasyFirstParser.DEFAULT_PORT;
    }

    return new EasyFirstParser(effectiveHost, effectivePort, stanfordPosTaggerModuleFileName);
}
/**
 * Parses a sentence and returns its annotated tree.
 * <p>
 * The sentence is parsed with {@code parser}, the resulting tree is copied into
 * an {@link ExtendedNode} tree, and that copy is annotated by {@code annotator}.
 *
 * @param sentence the sentence to parse and annotate
 * @return the tree returned by {@code annotator.getAnnotatedTree()}
 * @throws ConllConverterException wrapping any exception thrown while parsing or annotating
 */
private ExtendedNode annotateSentece(String sentence) throws ConllConverterException
{
    parser.setSentence(sentence);
    try
    {
        parser.parse();
        BasicNode basicTree = parser.getParseTree();

        ExtendedNode treeToAnnotate = TreeUtilities.copyFromBasicNode(basicTree);
        annotator.setTree(treeToAnnotate);
        annotator.annotate();

        return annotator.getAnnotatedTree();
    }
    catch (Exception e)
    {
        throw new ConllConverterException("see nested", e);
    }
}
// Usage fragment for EasyFirstClient:
//  1. a client built from a tokenizer, a POS tagger and a URL parses the raw `sentence`;
//  2. `client` is then reassigned to a client built from the URL alone, which parses
//     the already POS-tagged sentence held in this.posTaggedSentence.
// Afterwards the nodes list, the tree and the words-nodes list are read from `client`
// (i.e. from the second instance).
// NOTE(review): the first client's parse result is never read in this snippet — presumably
// these are two alternative usages rather than sequential code; confirm against the caller.
client = new EasyFirstClient(tokenizer, posTagger, url); client.parse(sentence); client = new EasyFirstClient(url); client.parse(this.posTaggedSentence); nodesList = client.getNodesAsList(); mutableTree = client.getTree(); wordsNodesList = client.getWordsNodesList();
/**
 * Parses a sentence that has already been tokenized and POS-tagged.
 * <p>
 * The tokens are converted to a tagged-text string, that string is sent to the
 * parser, and the returned lines are processed by {@code parseParserOutput}
 * (with {@code null} as the raw text).
 *
 * @param posTaggedSentence the tagged tokens of the sentence
 * @throws ParserRunException if an {@link IOException} occurs; the message names
 *         the parser URL and the tagged text that was being sent
 */
public void parse(List<PosTaggedToken> posTaggedSentence) throws ParserRunException
{
    final String taggedText = fixPosTaggedTokensAndConvertToString(posTaggedSentence);
    try
    {
        final List<String> outputLines = getParserOutputFromPosTaggedText(taggedText);
        parseParserOutput(outputLines, null);
    }
    catch (IOException e)
    {
        final String message =
            "Failed to run parser.\n*** Please make sure that the EasyFirst parser server is running, and listening on: "
            + parserUrl
            + "\nInput was the following tagger text:\n"
            + taggedText
            + "\nPlease see nested exception";
        throw new ParserRunException(message, e);
    }
}
/**
 * Takes raw text and returns the parser's output for it.
 * <p>
 * The text is tokenized and POS-tagged, the tagged tokens are converted to a
 * string, and that string is sent to the parser.
 *
 * @param rawText each sentence is a line; several lines produce several parses
 * @return the value returned by {@code getParserOutputFromPosTaggedText}
 * @throws ParserRunException if an {@link IOException} occurs along the way
 */
private List<String> getParserOutput(String rawText) throws ParserRunException
{
    try
    {
        final List<PosTaggedToken> taggedTokens = tokenizeAndPosTag(rawText);
        final String taggedText = fixPosTaggedTokensAndConvertToString(taggedTokens);
        return getParserOutputFromPosTaggedText(taggedText);
    }
    catch (IOException e)
    {
        throw new ParserRunException("Error openning a new URLConnection, or writing to or reading from the parser server", e);
    }
}
/**
 * Passes the tagged tokens through {@code inspectPosTaggedTokens} and converts
 * the result to a string with {@code posTaggedTokensToString}.
 *
 * @param posTaggedTokens the tagged tokens to process
 * @return the string form of the inspected tokens
 */
private String fixPosTaggedTokensAndConvertToString(List<PosTaggedToken> posTaggedTokens)
{
    return posTaggedTokensToString(
        inspectPosTaggedTokens(posTaggedTokens)
    );
}
/**
 * Entry point: builds a {@code DemoEasyFirst} from the arguments and runs its
 * {@code f()} method. Any exception is caught and its stack trace is printed to
 * standard output.
 *
 * @param args passed unchanged to the {@code DemoEasyFirst} constructor
 */
public static void main(String[] args)
{
    try
    {
        new DemoEasyFirst(args).f();
    }
    catch (Exception e)
    {
        e.printStackTrace(System.out);
    }
}
public void init() throws ParserRunException { if ( (this.tokenizer!=null) && (this.posTagger!=null) ) { initTokenizerAndPosTagger(); } else if ( (null==this.tokenizer) && (null==this.posTagger) ) { // do nothing } else throw new ParserRunException("Tokenizer and Pos-Tagger must be" + "either both null, or both non-null."); initialized=true; }
/**
 * Builds the inner tool: an {@link EasyFirstParser} constructed from the
 * {@code host} and {@code port} values, already initialized.
 *
 * @return the initialized parser
 * @throws Exception if constructing or initializing the parser fails
 */
@Override
protected EasyFirstParser buildInnerTool() throws Exception
{
    final EasyFirstParser innerParser = new EasyFirstParser(host, port);
    innerParser.init();
    return innerParser;
}
}
/**
 * Creates the standard parser: an {@link EasyFirstParser} on the given host and
 * port, using the supplied tokenizer and POS tagger. The new parser is passed to
 * {@code initAndCheckParser} before being returned.
 *
 * @param posTagger the POS tagger the parser should use
 * @param tokenizer the tokenizer the parser should use
 * @param parserHost host of the EasyFirst server
 * @param parserPort port of the EasyFirst server
 * @return the new parser, after {@code initAndCheckParser} has run on it
 * @throws ParserRunException if the parser cannot be initialized
 */
public static EnglishSingleTreeParser getInitializedStandardParser(PosTagger posTagger, Tokenizer tokenizer, String parserHost, int parserPort ) throws ParserRunException
{
    final EnglishSingleTreeParser standardParser =
        new EasyFirstParser(parserHost, parserPort, tokenizer, posTagger);
    initAndCheckParser(standardParser, parserHost, parserPort);
    return standardParser;
}
}
/**
 * Sets the sentence to work on.
 *
 * @param sentence the sentence text, stored in the field of the same name
 */
public void setSentence(String sentence)
{
    // reset() is always called before the new sentence is stored.
    reset();

    this.sentence = sentence;
}
/**
 * Constructor. Creates and initializes, in this order, an {@link EasyFirstParser}
 * and a {@link MaxentPosTagger}, both from the same model file.
 *
 * @param posTaggerModelFile e.g. "b:/jars/stanford-postagger-2008-09-28/bidirectional-wsj-0-18.tagger"
 * @throws JwktlException wrapping the {@code ParserRunException} or
 *         {@code PosTaggerException} raised while setting up either tool
 */
public WktGlossParser(String posTaggerModelFile) throws JwktlException
{
    // Step 1: the parser.
    try
    {
        parser = new EasyFirstParser(posTaggerModelFile);
        parser.init();
    }
    catch (ParserRunException e)
    {
        throw new JwktlException("could not init the parser", e);
    }

    // Step 2: the stand-alone POS tagger.
    try
    {
        posTagger = new MaxentPosTagger(posTaggerModelFile);
        posTagger.init();
    }
    catch (PosTaggerException e)
    {
        throw new JwktlException("POS tagger error", e);
    }
}
/** * @return a new initialized instance of a parser, to be used for testing the dependency paths classes. * Currently returns an EasyFirst parser on port 8081, * with Stanford POS tagger. * @throws ParserRunException if the parser cannot be initialized. */ public static BasicParser defaultParserForTesting() throws ParserRunException { final String DEFAULT_PARSER_HOST = "te-srv1"; final int DEFAULT_PARSER_PORT = 8081; final String POS_TAGGER_MODEL = System.getenv("JARS")+"/stanford-postagger-full-2008-09-28/models/bidirectional-wsj-0-18.tagger"; BasicParser parser = new EasyFirstParser(DEFAULT_PARSER_HOST, DEFAULT_PARSER_PORT, POS_TAGGER_MODEL); String TEST_SENTENCE = "And there was light"; // just to test that the parser is active. try { parser.init(); parser.setSentence(TEST_SENTENCE); parser.parse(); // test that the parser is active } catch (ParserRunException ex) { throw new ParserRunException( "Cannot get a working EasyFirst parser! Please check that: \n"+ " A. EasyFirst server is listening on host "+DEFAULT_PARSER_HOST+", port "+DEFAULT_PARSER_PORT+". If it is not, run:\n"+ "\tpython "+System.getenv("JARS")+"/easyfirst/biu_distrib_09072011/sdparser_server.py "+DEFAULT_PARSER_PORT+"\n" + " B. There is a POS tagger model at "+POS_TAGGER_MODEL); } return parser; }
/**
 * Constructor. Reads the truth-teller module section of the configuration file
 * (with environment-variable expansion switched on), then creates the sentence
 * annotator and an initialized {@link EasyFirstParser}, and finally creates the
 * CoNLL output directory (including missing parent directories).
 *
 * @param confFile the configuration file to read the module parameters from
 * @throws ConfigurationException if reading the configuration fails
 * @throws ConllConverterException wrapping any exception thrown while creating
 *         the annotator or the parser
 */
public AnnotateSentenceToConll(ConfigurationFile confFile) throws ConfigurationException, ConllConverterException
{
    confFile.setExpandingEnvironmentVariables(true);
    annotationParams = confFile.getModuleConfiguration(TransformationsConfigurationParametersNames.TRUTH_TELLER_MODULE_NAME);

    try
    {
        annotator = new DefaultSentenceAnnotator(annotationParams);

        final String posTaggerString = annotationParams.get(TransformationsConfigurationParametersNames.PREPROCESS_EASYFIRST);
        final String host = annotationParams.get(TransformationsConfigurationParametersNames.PREPROCESS_EASYFIRST_HOST);
        final int port = annotationParams.getInt(TransformationsConfigurationParametersNames.PREPROCESS_EASYFIRST_PORT);

        parser = new EasyFirstParser(host, port, posTaggerString);
        parser.init();
    }
    catch (Exception e)
    {
        throw new ConllConverterException("see nested", e);
    }

    conllOutputFolder = new File(annotationParams.get(TransformationsConfigurationParametersNames.CONLL_FORMAT_OUTPUT_DIRECTORY));
    conllOutputFolder.mkdirs();
}
/**
 * Constructor. Creates the processing tools (sentence splitter, tokenizer, POS
 * tagger, named-entity recognizer and EasyFirst parser) from the settings in
 * {@code BiuTestParams}, then initializes the named-entity recognizer and the
 * parser.
 *
 * @throws TokenizerException declared for the tokenizer setup
 * @throws PosTaggerException declared for the POS-tagger setup
 * @throws NamedEntityRecognizerException declared for the named-entity recognizer setup
 * @throws ParserRunException declared for the parser setup
 */
public BiuTreeBuilder() throws TokenizerException, PosTaggerException, NamedEntityRecognizerException, ParserRunException
{
    // Construction phase.
    splitter = new LingPipeSentenceSplitter();
    tokenizer = new MaxentTokenizer();
    tagger = new MaxentPosTagger(BiuTestParams.MAXENT_POS_TAGGER_MODEL_FILE);
    ner = new StanfordNamedEntityRecognizer(new File(BiuTestParams.STANFORD_NER_CLASSIFIER_PATH));
    parser = new EasyFirstParser(BiuTestParams.EASYFIRST_HOST, BiuTestParams.EASYFIRST_PORT, tokenizer, tagger);

    // Initialization phase: only the recognizer and the parser are initialized here.
    ner.init();
    parser.init();
}
// Builds an EasyFirstParser from the first three elements of `args` (the second one is
// converted with Integer.parseInt) and initializes it.
// NOTE(review): presumably args are host, port and POS-tagger model file, matching the
// (host, port, model-file) constructor usage seen elsewhere — confirm against the caller.
BasicParser parser = new EasyFirstParser(args[0], Integer.parseInt(args[1]), args[2]); parser.init();