/**
 * Decodes the sentence with {@code nlpDecoder} and stores a named-entity label on every word.
 *
 * <p>The tag read from each decoded node is rewritten before it is stored: every
 * {@code "U-"} becomes {@code "B-"} and every {@code "L-"} becomes {@code "I-"}
 * (presumably a BILOU-to-BIO conversion; confirm against the model's tag set).
 *
 * @param sentenceWords the words of one sentence; each receives its label via {@code setNerLabel}
 */
public void tagSentence(List<Word> sentenceWords) {
    NLPNode[] tagged = nlpDecoder.decode(toNodeArray(sentenceWords));

    // Word k of the list is paired with node k + 1 of the decoded array
    // (slot 0 is presumably an artificial root node; TODO confirm).
    int nodeIndex = 1;
    for (Word word : sentenceWords) {
        String rawTag = tagged[nodeIndex++].getNamedEntityTag();
        String label = rawTag.replace("U-", "B-").replace("L-", "I-");
        word.setNerLabel(label);
    }
}
/**
 * Demo entry point: builds an {@code NLPDecoder} from the English decoding configuration,
 * decodes one hard-coded sentence and prints its nodes, then decodes a sample text file
 * to standard output in raw format.
 *
 * @param args ignored
 * @throws Exception propagated from opening the files or from the decoder
 */
public static void main(String[] args) throws Exception {
    final String configPath = "src/main/resources/edu/emory/mathcs/nlp/configuration/config-decode-en.xml";
    final String samplePath = "src/test/resources/dat/nlp4j.txt";

    NLPDecoder decoder = new NLPDecoder(IOUtils.createFileInputStream(configPath));

    // Single in-memory sentence: nodes are joined with newlines, starting from index 1
    // (index 0 is presumably the artificial root; confirm against Joiner.join).
    NLPNode[] decoded = decoder.decode("John bought a car for Mary.");
    System.out.println(Joiner.join(decoded, "\n", 1)+"\n");

    // Whole sample file, written straight to standard output.
    decoder.decode(IOUtils.createFileInputStream(samplePath), System.out, AbstractNLPDecoder.FORMAT_RAW);
}
} // closes the enclosing type, whose header lies outside this excerpt
/**
 * Small demonstration of the decoder: loads the English decoding configuration, prints the
 * decoded nodes of one example sentence, and then streams the decoded sample file to
 * {@code System.out} using {@code AbstractNLPDecoder.FORMAT_RAW}.
 *
 * @param args not used
 * @throws Exception if a file cannot be opened or decoding fails
 */
public static void main(String[] args) throws Exception {
    final String configurationPath = "src/main/resources/edu/emory/mathcs/nlp/configuration/config-decode-en.xml";
    final String inputPath = "src/test/resources/dat/nlp4j.txt";
    final String example = "John bought a car for Mary.";

    NLPDecoder nlp = new NLPDecoder(IOUtils.createFileInputStream(configurationPath));

    // Print the example's nodes one per line; the join starts at index 1
    // (presumably skipping an artificial root at index 0; TODO confirm).
    NLPNode[] exampleNodes = nlp.decode(example);
    System.out.println(Joiner.join(exampleNodes, "\n", 1)+"\n");

    // Decode the sample file and emit the result on standard output.
    nlp.decode(IOUtils.createFileInputStream(inputPath), System.out, AbstractNLPDecoder.FORMAT_RAW);
}
} // closes the enclosing type, whose header lies outside this excerpt
/**
 * Runs a complete decoding job from command-line arguments.
 *
 * <p>The arguments are bound onto this object's fields through {@code BinUtils.initArgs};
 * the input files matching {@code input_path} and {@code input_ext} are then collected and
 * sorted, a decoder is built from {@code configuration_file}, and every file is decoded
 * using {@code output_ext}, {@code format} and {@code threads}.
 *
 * @param args command-line arguments consumed by {@code BinUtils.initArgs}
 */
public NLPDecode(String[] args) {
    BinUtils.initArgs(args, this);

    // The trailing 'false' is presumably a "recursive" flag; confirm in FileUtils.getFileList.
    List<String> inputFiles = FileUtils.getFileList(input_path, input_ext, false);
    Collections.sort(inputFiles);

    decoder = new NLPDecoder(IOUtils.createFileInputStream(configuration_file));
    decoder.decode(inputFiles, output_ext, format, threads);
}
/**
 * Parses the command-line options into this instance and immediately decodes all matching files.
 *
 * <p>Steps, in order: bind {@code args} with {@code BinUtils.initArgs}; list the files under
 * {@code input_path} having extension {@code input_ext}; sort that list; create the decoder
 * from {@code configuration_file}; decode the sorted files with the configured output
 * extension, format and thread count.
 *
 * @param args command-line arguments consumed by {@code BinUtils.initArgs}
 */
public NLPDecode(String[] args) {
    BinUtils.initArgs(args, this);

    // NOTE(review): meaning of the 'false' flag is not visible here (likely non-recursive listing).
    List<String> sortedInputs = FileUtils.getFileList(input_path, input_ext, false);
    Collections.sort(sortedInputs);

    decoder = new NLPDecoder(IOUtils.createFileInputStream(configuration_file));
    decoder.decode(sortedInputs, output_ext, format, threads);
}
/**
 * Reads tab-separated token lines from {@code in}, segments them, decodes each segment and
 * writes the decoded nodes to {@code out}.
 *
 * <p>Reading stops at the first line that is empty after trimming, or at end of input.
 * The first two tab-separated fields of each line are used to build an {@code ItToken}.
 * Each decoded segment is printed followed by a blank line.
 *
 * <p>Both streams are closed when this method returns, including when it exits with an
 * exception (previously they were leaked if reading, decoding or checking failed).
 *
 * @param in  source of the token lines; closed by this method
 * @param out destination of the decoded output; closed by this method
 * @throws Exception if reading, decoding or checking fails
 */
public void convert(InputStream in, OutputStream out) throws Exception {
    // try-with-resources guarantees the close even on the failure path.
    try (BufferedReader reader = IOUtils.createBufferedReader(in);
         PrintStream fout = IOUtils.createBufferedPrintStream(out)) {
        List<ItToken> list = new ArrayList<>();
        String line;

        // A blank (whitespace-only) line terminates the input just like end-of-stream.
        while ((line = reader.readLine()) != null && !(line = line.trim()).isEmpty()) {
            String[] t = Splitter.splitTabs(line);
            list.add(new ItToken(t[0], t[1]));
        }

        for (List<ItToken> tokens : tokenizer.segmentize(list)) {
            NLPNode[] nodes = decoder.toNodeArray(tokens, token -> create(token));
            decoder.decode(nodes);
            check(nodes);
            // println plus the extra "\n" leaves one empty line between segments.
            fout.println(decoder.toString(nodes)+"\n");
        }
    }
}
/**
 * Decodes the sentence with {@code nlpDecoder} and copies the dependency head id and
 * dependency label of each decoded node onto the corresponding word.
 *
 * <p>Words whose part-of-speech tag equals {@code "CH"} have their dependency label
 * overwritten with {@code "punct"} after the decoded label has been set.
 *
 * @param sentenceWords the words of one sentence; updated in place
 */
public void tagSentence(List<Word> sentenceWords) {
    NLPNode[] parsed = nlpDecoder.decode(toNodeArray(sentenceWords));

    // Iterate with the node index: node k belongs to word k - 1
    // (slot 0 of the decoded array is presumably an artificial root; TODO confirm).
    for (int nodeIdx = 1; nodeIdx <= sentenceWords.size(); nodeIdx++) {
        Word word = sentenceWords.get(nodeIdx - 1);

        word.setHead(parsed[nodeIdx].getDependencyHead().getID());
        word.setDepLabel(parsed[nodeIdx].getDependencyLabel());

        // Constant-first equals also covers a null POS tag.
        if ("CH".equals(word.getPosTag())) {
            word.setDepLabel("punct");
        }
    }
}
/**
 * Converts a stream of tab-separated token lines into decoded output.
 *
 * <p>Lines are read from {@code in} until end of input or the first line that is empty once
 * trimmed. Each line is split on tabs and its first two fields become an {@code ItToken}.
 * The collected tokens are segmented by {@code tokenizer}; every segment is turned into a
 * node array, decoded, passed to {@code check}, and printed to {@code out} followed by a
 * blank line.
 *
 * <p>The reader and the print stream are managed by try-with-resources, so both are closed
 * on normal completion and when an exception escapes (the earlier version closed them only
 * on the success path).
 *
 * @param in  input stream of token lines; closed by this method
 * @param out output stream for the decoded text; closed by this method
 * @throws Exception if reading, decoding or checking fails
 */
public void convert(InputStream in, OutputStream out) throws Exception {
    try (BufferedReader reader = IOUtils.createBufferedReader(in);
         PrintStream fout = IOUtils.createBufferedPrintStream(out)) {
        List<ItToken> list = new ArrayList<>();
        String line;

        // Stop at end-of-stream or at the first whitespace-only line.
        while ((line = reader.readLine()) != null && !(line = line.trim()).isEmpty()) {
            String[] fields = Splitter.splitTabs(line);
            list.add(new ItToken(fields[0], fields[1]));
        }

        for (List<ItToken> tokens : tokenizer.segmentize(list)) {
            NLPNode[] nodes = decoder.toNodeArray(tokens, token -> create(token));
            decoder.decode(nodes);
            check(nodes);
            // The appended "\n" plus println yields an empty separator line per segment.
            fout.println(decoder.toString(nodes)+"\n");
        }
    }
}
/**
 * Batch demo: decodes every {@code txt} file found in a fixed input directory with the
 * de-identification configuration and writes the result next to each input as
 * {@code <input>.tsv}, using {@code AbstractNLPDecoder.FORMAT_LINE}.
 *
 * <p>NOTE(review): the configuration and input locations are absolute paths on one
 * developer machine; this will only run elsewhere after they are adjusted.
 *
 * @param args ignored
 * @throws Exception propagated from file access or from the decoder
 */
public static void main(String[] args) throws Exception {
    final String configPath = "/Users/jdchoi/Documents/EmoryNLP/nlp4j/src/main/resources/edu/emory/mathcs/nlp/configuration/config-decode-deident.xml";
    final String sourceDir = "/Users/jdchoi/Desktop/radiology/Q2";
    final String sourceExt = "txt";
    final String targetExt = "tsv";
    final String lineFormat = AbstractNLPDecoder.FORMAT_LINE;

    NLPDecoder decoder = new NLPDecoder(IOUtils.createFileInputStream(configPath));

    for (String sourceFile : FileUtils.getFileList(sourceDir, sourceExt)) {
        // Progress trace: echo the file about to be processed.
        System.out.println(sourceFile);

        String targetFile = sourceFile+"."+targetExt;
        decoder.decode(
                IOUtils.createFileInputStream(sourceFile),
                IOUtils.createFileOutputStream(targetFile),
                lineFormat);
    }
}
} // closes the enclosing type, whose header lies outside this excerpt
/**
 * Decodes all {@code txt} files of a hard-coded directory using the de-identification
 * configuration. For each input file the path is printed, and the decoded output is written
 * in {@code AbstractNLPDecoder.FORMAT_LINE} to a sibling file named {@code <input>.tsv}.
 *
 * <p>NOTE(review): both paths below are absolute and specific to one workstation; adjust
 * them before running in another environment.
 *
 * @param args not used
 * @throws Exception if a file cannot be opened or decoding fails
 */
public static void main(String[] args) throws Exception {
    final String configurationPath = "/Users/jdchoi/Documents/EmoryNLP/nlp4j/src/main/resources/edu/emory/mathcs/nlp/configuration/config-decode-deident.xml";
    final String inputDirectory = "/Users/jdchoi/Desktop/radiology/Q2";
    final String inputExtension = "txt";
    final String outputExtension = "tsv";
    final String format = AbstractNLPDecoder.FORMAT_LINE;

    NLPDecoder nlp = new NLPDecoder(IOUtils.createFileInputStream(configurationPath));

    for (String inputPath : FileUtils.getFileList(inputDirectory, inputExtension)) {
        System.out.println(inputPath);

        // Output lands beside the input: "<input path>.tsv".
        String outputPath = inputPath+"."+outputExtension;
        nlp.decode(
                IOUtils.createFileInputStream(inputPath),
                IOUtils.createFileOutputStream(outputPath),
                format);
    }
}
} // closes the enclosing type, whose header lies outside this excerpt
decoder.decode(sentence); for (int x = 1; x < sentence.length; x++) { total++;
decoder.decode(sentence); for (int x = 1; x < sentence.length; x++) { total++;