/**
 * Collects the names of the {@code pp-*.xml} files found directly inside {@code dataDir},
 * with each name passed through {@code IOUtils.stripFileExtension}.
 *
 * <p>A directory entry is kept when its name starts with {@code "pp-"}, ends with
 * {@code ".xml"}, and {@code IOUtils.isFile} accepts its absolute path.
 *
 * @param dataDir path of the directory to scan
 * @return a new list with one entry per matching file, in the order reported by
 *         {@link File#list(FilenameFilter)}
 * @throws IllegalArgumentException if {@code dataDir} cannot be listed
 */
private List<String> getFiles(String dataDir) {
    FilenameFilter xmlFilter = (dir, name) -> name.startsWith("pp-")
            && name.endsWith(".xml")
            && IOUtils.isFile(dir.getAbsolutePath() + File.separator + name);

    // File.list reports "not a directory" and I/O errors by returning null instead of
    // throwing. An assert alone is skipped when assertions are disabled, which would
    // surface as a bare NullPointerException in the loop below, so fail explicitly.
    String[] xmlFiles = new File(dataDir).list(xmlFilter);
    if (xmlFiles == null) {
        throw new IllegalArgumentException("Cannot list files in directory: " + dataDir);
    }

    List<String> files = new ArrayList<>(xmlFiles.length);
    for (String fileName : xmlFiles) {
        files.add(IOUtils.stripFileExtension(fileName));
    }
    return files;
}
} // closes an enclosing scope whose opening brace is outside this excerpt
/**
 * Collects the names of the {@code pp-*.xml} files found directly inside {@code dataDir},
 * with each name passed through {@code IOUtils.stripFileExtension}.
 *
 * <p>A directory entry is kept when its name starts with {@code "pp-"}, ends with
 * {@code ".xml"}, and {@code IOUtils.isFile} accepts its absolute path.
 *
 * @param dataDir path of the directory to scan
 * @return a new list with one entry per matching file, in the order reported by
 *         {@link File#list(FilenameFilter)}
 * @throws IllegalArgumentException if {@code dataDir} cannot be listed
 */
private List<String> getFiles(String dataDir) {
    FilenameFilter xmlFilter = (dir, name) -> name.startsWith("pp-")
            && name.endsWith(".xml")
            && IOUtils.isFile(dir.getAbsolutePath() + File.separator + name);

    // File.list reports "not a directory" and I/O errors by returning null instead of
    // throwing. An assert alone is skipped when assertions are disabled, which would
    // surface as a bare NullPointerException in the loop below, so fail explicitly.
    String[] xmlFiles = new File(dataDir).list(xmlFilter);
    if (xmlFiles == null) {
        throw new IllegalArgumentException("Cannot list files in directory: " + dataDir);
    }

    List<String> files = new ArrayList<>(xmlFiles.length);
    for (String fileName : xmlFiles) {
        files.add(IOUtils.stripFileExtension(fileName));
    }
    return files;
}
} // closes an enclosing scope whose opening brace is outside this excerpt
/**
 * Returns the file stem for {@code path}: the value produced by {@code getFileName(path)}
 * after it has been passed through {@code stripFileExtension}.
 *
 * @param path the path handed to {@code getFileName}
 * @return the result of {@code stripFileExtension} applied to that file name
 */
public static String getFileStem(String path) {
    final String fileName = getFileName(path);
    return stripFileExtension(fileName);
}
/**
 * Returns the file stem for {@code path}: the value produced by {@code getFileName(path)}
 * after it has been passed through {@code stripFileExtension}.
 *
 * @param path the path handed to {@code getFileName}
 * @return the result of {@code stripFileExtension} applied to that file name
 */
public static String getFileStem(String path) {
    final String fileName = getFileName(path);
    return stripFileExtension(fileName);
}
String lemma = IOUtils.stripFileExtension(fileName);
private void readPropbankFrameData(String dir) throws Exception { frameData = new HashMap<>(); DocumentBuilderFactory dbf = DocumentBuilderFactory.newInstance(); dbf.setNamespaceAware(false); dbf.setValidating(false); for (String file : IOUtils.lsFiles(dir, (dir1, name) -> name.endsWith("xml"))) { // IOUtils.getFileName(file) doesn't work in Windows int slashIndex = file.lastIndexOf(File.separator); String fileName = file.substring(slashIndex + 1); // A hack to deal with percent-sign in nombank. There is another // file called perc-sign that will fill this void. if (fileName.contains("percent-sign.xml")) continue; DocumentBuilder db = dbf.newDocumentBuilder(); Document doc = db.parse(file); NodeList predicateElements = doc.getElementsByTagName("predicate"); for (int i = 0; i < predicateElements.getLength(); i++) { String lemma = IOUtils.stripFileExtension(fileName); FrameData fData = new FrameData(lemma); frameData.put(lemma, fData); NodeList roleSets = doc.getElementsByTagName("roleset"); addRoleSets(fileName, lemma, fData, roleSets); } } }
String lemma = IOUtils.stripFileExtension(fileName);
String lemma = IOUtils.stripFileExtension(fileName);
sense = "1-slash-10th.01"; assert sense.startsWith(IOUtils.stripFileExtension(file)) || sense.startsWith(lemma) : lemma + "\t" + sense;
sense = "1-slash-10th.01"; assert sense.startsWith(IOUtils.stripFileExtension(file)) || sense.startsWith(lemma) : lemma + "\t" + sense;
(files.length + failed.size()), failed.size()); for (String file : files) { String taHashStr = IOUtils.stripFileExtension(IOUtils.getFileName(file));
String outFileStem = IOUtils.stripFileExtension( file ); if(!textOutput){ String outFile = outDir + "/" + outFileStem + ".ser";
String outFilePrefix = IOUtils.stripFileExtension( annotationOutFile ); String fineNerOutDir = nerOutputDir + "/" + EventConstants.NER_ACE_FINE; String coarseNerOutDir = nerOutputDir + "/" + EventConstants.NER_ACE_COARSE;
String outFileStem = IOUtils.stripFileExtension(file); if (!textOutput) { String outFile = outDir + "/" + outFileStem + ".ser";