edu.illinois.cs.cogcomp.core.io.LineIO.slurp java code examples

/**
 * Reads an entire file into one string, decoding it with the default charset.
 *
 * <p>This is a convenience overload: it looks up the name of
 * {@link Charset#defaultCharset()} and delegates to the two-argument {@code slurp}.
 *
 * @param fileName name of the file to read
 * @return the contents of the file as a single string
 * @throws FileNotFoundException propagated from the two-argument {@code slurp}
 */
public static String slurp(String fileName) throws FileNotFoundException {
  String defaultCharsetName = Charset.defaultCharset().name();
  return slurp(fileName, defaultCharsetName);
}

/**
 * Reads an entire file into one string, decoding it with the default charset.
 *
 * <p>This is a convenience overload: it looks up the name of
 * {@link Charset#defaultCharset()} and delegates to the two-argument {@code slurp}.
 *
 * @param fileName name of the file to read
 * @return the contents of the file as a single string
 * @throws FileNotFoundException propagated from the two-argument {@code slurp}
 */
public static String slurp(String fileName) throws FileNotFoundException {
  String defaultCharsetName = Charset.defaultCharset().name();
  return slurp(fileName, defaultCharsetName);
}

/**
 * Reads the named file into a single string and runs the annotation pipeline over that text.
 *
 * <p>The first two arguments passed to {@code pipeline.createAnnotatedTextAnnotation} are empty
 * strings (presumably the corpus id and text id; confirm against the pipeline API).
 *
 * @param fileName name of the text file to annotate
 * @return the TextAnnotation returned by {@code pipeline.createAnnotatedTextAnnotation}
 * @throws FileNotFoundException propagated from {@code LineIO.slurp}
 * @throws AnnotatorException declared for the pipeline call
 */
public TextAnnotation RunPipelineOnFile(String fileName) throws FileNotFoundException,
    AnnotatorException {
  String text = LineIO.slurp(fileName);
  return pipeline.createAnnotatedTextAnnotation("", "", text);
}

/**
 * Reads the named file into a single string and runs the annotation pipeline over that text.
 *
 * <p>The first two arguments passed to {@code pipeline.createAnnotatedTextAnnotation} are empty
 * strings (presumably the corpus id and text id; confirm against the pipeline API).
 *
 * @param fileName name of the text file to annotate
 * @return the TextAnnotation returned by {@code pipeline.createAnnotatedTextAnnotation}
 * @throws FileNotFoundException propagated from {@code LineIO.slurp}
 * @throws AnnotatorException declared for the pipeline call
 */
public TextAnnotation RunPipelineOnFile(String fileName) throws FileNotFoundException,
    AnnotatorException {
  String text = LineIO.slurp(fileName);
  return pipeline.createAnnotatedTextAnnotation("", "", text);
}

/**
 * Load one serialized record from a file and deserialize it into a TextAnnotation.
 *
 * <p>When {@code isJson} is true the file is read as text and passed to
 * {@code SerializationHelper.deserializeFromJson}. Otherwise the file's bytes are passed to
 * {@code deserializeTextAnnotationFromBytes}; that path expects Thrift serialization format,
 * one record in a single file.
 *
 * @param fileName Name of file to read from
 * @param isJson true to read the file as JSON text, false to read it as serialized bytes
 * @return A text annotation
 * @throws Exception an {@link IOException} when the file does not exist; otherwise whatever the
 *     file reader or the deserializer throws
 */
public static TextAnnotation deserializeTextAnnotationFromFile(String fileName, boolean isJson)
    throws Exception {
  File serializedFile = new File(fileName);
  if (!serializedFile.exists()) {
    String message = "ERROR: " + NAME + ".deserializeTextAnnotationFromFile(): file '"
        + fileName + "' does not exist.";
    throw new IOException(message);
  }
  if (isJson) {
    return SerializationHelper.deserializeFromJson(LineIO.slurp(fileName));
  }
  byte[] serializedBytes = FileUtils.readFileToByteArray(serializedFile);
  return deserializeTextAnnotationFromBytes(serializedBytes);
}

/**
 * Load one serialized record from a file and deserialize it into a TextAnnotation.
 *
 * <p>When {@code isJson} is true the file is read as text and passed to
 * {@code SerializationHelper.deserializeFromJson}. Otherwise the file's bytes are passed to
 * {@code deserializeTextAnnotationFromBytes}; that path expects Thrift serialization format,
 * one record in a single file.
 *
 * @param fileName Name of file to read from
 * @param isJson true to read the file as JSON text, false to read it as serialized bytes
 * @return A text annotation
 * @throws Exception an {@link IOException} when the file does not exist; otherwise whatever the
 *     file reader or the deserializer throws
 */
public static TextAnnotation deserializeTextAnnotationFromFile(String fileName, boolean isJson)
    throws Exception {
  File serializedFile = new File(fileName);
  if (!serializedFile.exists()) {
    String message = "ERROR: " + NAME + ".deserializeTextAnnotationFromFile(): file '"
        + fileName + "' does not exist.";
    throw new IOException(message);
  }
  if (isJson) {
    return SerializationHelper.deserializeFromJson(LineIO.slurp(fileName));
  }
  byte[] serializedBytes = FileUtils.readFileToByteArray(serializedFile);
  return deserializeTextAnnotationFromBytes(serializedBytes);
}

/**
 * Builds TextAnnotation objects from one entry of the corpus file list generated by
 * {@link #getFileListing()}.
 *
 * <p>Only the first path in the entry is read. The last name element of that path becomes
 * {@code fileId}; the file text is passed through {@code stripText} and the result is handed to
 * {@code taBuilder}. The returned list holds that one annotation, or is empty when the builder
 * returns null.
 *
 * @param corpusFileListEntry corpus file containing content to be processed
 * @return List of TextAnnotation objects extracted from the corpus file
 * @throws Exception if reading the file or building the annotation fails
 */
@Override
public List<TextAnnotation> getAnnotationsFromFile(List<Path> corpusFileListEntry) throws Exception {
  Path sourcePath = corpusFileListEntry.get(0);
  int lastNameIndex = sourcePath.getNameCount() - 1;
  fileId = sourcePath.getName(lastNameIndex).toString();
  logger.debug("read source file {}", fileId);
  numFiles++;

  newFileText = this.stripText(LineIO.slurp(sourcePath.toString()));
  TextAnnotation annotation =
      taBuilder.createTextAnnotation(corpusName, fileId, newFileText.toString());

  List<TextAnnotation> annotations = new ArrayList<>(1);
  if (annotation == null) {
    return annotations;
  }
  annotations.add(annotation);
  numTextAnnotations++;
  return annotations;
}

/**
 * Builds XmlTextAnnotation objects from one entry of the corpus file list generated by
 * {@link #getFileListing()}. An entry may list several files to allow for corpora whose
 * annotations are provided in standoff format, separate from the source document: in that
 * case the first file should be the source document and the rest the corresponding markup files.
 *
 * <p>This implementation assumes a single file contains both source and markup, so only the
 * first path is read. The returned list holds one annotation, or is empty when
 * {@code xmlTextAnnotationMaker} returns null.
 *
 * @param corpusFileListEntry a list of files, the first of which is a source file.
 * @return List of XmlTextAnnotation objects extracted from the corpus file.
 * @throws Exception if reading the file or building the annotation fails
 */
@Override
public List<XmlTextAnnotation> getAnnotationsFromFile(List<Path> corpusFileListEntry) throws Exception {
  Path sourcePath = corpusFileListEntry.get(0);
  int lastNameIndex = sourcePath.getNameCount() - 1;
  fileId = sourcePath.getName(lastNameIndex).toString();
  logger.debug("read source file {}", fileId);
  numFiles++;

  String rawText = LineIO.slurp(sourcePath.toString());
  XmlTextAnnotation annotation =
      xmlTextAnnotationMaker.createTextAnnotation(rawText, this.corpusName, fileId);

  List<XmlTextAnnotation> annotations = new ArrayList<>(1);
  if (annotation != null) {
    annotations.add(annotation);
    numTextAnnotations++;
  }
  return annotations;
}

/**
 * Reads the current file and returns the annotation built from its contents.
 *
 * <p>Returns null when the file cannot be read: a missing file is recorded in
 * {@code badFiles}, and any other failure has its stack trace printed. This method does not
 * itself change {@code currentAnnotationId}.
 * NOTE(review): presumably {@code nextAnnotation} or the caller advances it; confirm.
 *
 * @return an annotation object, or null if the current file could not be read.
 * @throws IllegalStateException wrapping the AnnotatorException if building the annotation fails
 */
@Override
public XmlTextAnnotation next() {
  final String contents;
  try {
    contents = LineIO.slurp(this.currentfile);
  } catch (FileNotFoundException missing) {
    this.badFiles.add(this.currentfile);
    return null;
  } catch (Throwable unexpected) {
    unexpected.printStackTrace();
    return null;
  }

  try {
    return nextAnnotation(contents, this.currentfile);
  } catch (AnnotatorException failure) {
    failure.printStackTrace();
    throw new IllegalStateException(failure);
  }
}

/**
 * Builds XmlTextAnnotation objects from one entry of the corpus file list generated by
 * {@link #getFileListing()}. An entry may list several files to allow for corpora whose
 * annotations are provided in standoff format, separate from the source document: in that
 * case the first file should be the source document and the rest the corresponding markup files.
 *
 * <p>This implementation assumes a single file contains both source and markup, so only the
 * first path is read. The returned list holds one annotation, or is empty when
 * {@code xmlTextAnnotationMaker} returns null.
 *
 * @param corpusFileListEntry a list of files, the first of which is a source file.
 * @return List of XmlTextAnnotation objects extracted from the corpus file.
 * @throws Exception if reading the file or building the annotation fails
 */
@Override
public List<XmlTextAnnotation> getAnnotationsFromFile(List<Path> corpusFileListEntry) throws Exception {
  Path sourcePath = corpusFileListEntry.get(0);
  int lastNameIndex = sourcePath.getNameCount() - 1;
  fileId = sourcePath.getName(lastNameIndex).toString();
  logger.debug("read source file {}", fileId);
  numFiles++;

  String rawText = LineIO.slurp(sourcePath.toString());
  XmlTextAnnotation annotation =
      xmlTextAnnotationMaker.createTextAnnotation(rawText, this.corpusName, fileId);

  List<XmlTextAnnotation> annotations = new ArrayList<>(1);
  if (annotation != null) {
    annotations.add(annotation);
    numTextAnnotations++;
  }
  return annotations;
}

/**
 * Reads the current file and returns the annotation built from its contents.
 *
 * <p>Returns null when the file cannot be read: a missing file is recorded in
 * {@code badFiles}, and any other failure has its stack trace printed. This method does not
 * itself change {@code currentAnnotationId}.
 * NOTE(review): presumably {@code nextAnnotation} or the caller advances it; confirm.
 *
 * @return an annotation object, or null if the current file could not be read.
 * @throws IllegalStateException wrapping the AnnotatorException if building the annotation fails
 */
@Override
public XmlTextAnnotation next() {
  final String contents;
  try {
    contents = LineIO.slurp(this.currentfile);
  } catch (FileNotFoundException missing) {
    this.badFiles.add(this.currentfile);
    return null;
  } catch (Throwable unexpected) {
    unexpected.printStackTrace();
    return null;
  }

  try {
    return nextAnnotation(contents, this.currentfile);
  } catch (AnnotatorException failure) {
    failure.printStackTrace();
    throw new IllegalStateException(failure);
  }
}

/**
 * Builds TextAnnotation objects from one entry of the corpus file list generated by
 * {@link #getFileListing()}.
 *
 * <p>Only the first path in the entry is read. The last name element of that path becomes
 * {@code fileId}; the file text is passed through {@code stripText} and the result is handed to
 * {@code taBuilder}. The returned list holds that one annotation, or is empty when the builder
 * returns null.
 *
 * @param corpusFileListEntry corpus file containing content to be processed
 * @return List of TextAnnotation objects extracted from the corpus file
 * @throws Exception if reading the file or building the annotation fails
 */
@Override
public List<TextAnnotation> getAnnotationsFromFile(List<Path> corpusFileListEntry) throws Exception {
  Path sourcePath = corpusFileListEntry.get(0);
  int lastNameIndex = sourcePath.getNameCount() - 1;
  fileId = sourcePath.getName(lastNameIndex).toString();
  logger.debug("read source file {}", fileId);
  numFiles++;

  newFileText = this.stripText(LineIO.slurp(sourcePath.toString()));
  TextAnnotation annotation =
      taBuilder.createTextAnnotation(corpusName, fileId, newFileText.toString());

  List<TextAnnotation> annotations = new ArrayList<>(1);
  if (annotation == null) {
    return annotations;
  }
  annotations.add(annotation);
  numTextAnnotations++;
  return annotations;
}

// Announce the path before attempting the read, so the message still appears if the read throws.
System.out.println("Trying to read: " + parallelpath + "/en-" + parid);
// Read the whole file into a single string; note that `file` holds the contents, not a path.
String file = LineIO.slurp(parallelpath + "/en-" + parid);

TextAnnotation ta;
try {
  ta = SerializationHelper.deserializeFromJson(LineIO.slurp(file));
} catch (Exception e) {
  logger.error("Error while reading file {}\n{}", file, e.getMessage());

private List<TextAnnotation> buildTextAnnotation(Path textPath, Path sentPath, Path tokPath, Path pennPath) throws FileNotFoundException, XMLStreamException {
  String text = LineIO.slurp(textPath.toFile().getAbsolutePath());
  List<Pair<String, IntPair>> tokenInfo = tokenParser.parseFile(tokPath.toFile().getAbsolutePath());
  Pair<List<SentenceStaxParser.MascSentence>, List<SentenceStaxParser.MascSentenceGroup>> sentenceInfo =

private List<TextAnnotation> buildTextAnnotation(Path textPath, Path sentPath, Path tokPath, Path pennPath) throws FileNotFoundException, XMLStreamException {
  String text = LineIO.slurp(textPath.toFile().getAbsolutePath());
  List<Pair<String, IntPair>> tokenInfo = tokenParser.parseFile(tokPath.toFile().getAbsolutePath());
  Pair<List<SentenceStaxParser.MascSentence>, List<SentenceStaxParser.MascSentenceGroup>> sentenceInfo =

try
  input = LineIO.slurp( inFile );

String input = null;
try {
  input = LineIO.slurp(inFile);
} catch (FileNotFoundException e) {
  e.printStackTrace();

// Read the entire file at the canonical path of `file` into a single string (default charset).
String document = LineIO.slurp(file.getCanonicalPath());

// Read the entire file at the canonical path of `file` into a single string (default charset).
String document = LineIO.slurp(file.getCanonicalPath());

Javadoc

Read the contents of a file using the default charset and return as a single string

Popular methods of LineIO

read
This function reads a file line-by-line and converts each line into an object using a transformer th
write
This function writes a list of objects into a file, one per line. Each object is transformed into a
readFromClasspath
This searches for the file on the classpath before reading it. If it doesn't find the file, it throw
append
Append a string to a file
readGZip
This function reads a gzipped file line-by-line and converts each line into an object using a transf
getInputStream
This looks around to find the file, then returns an open inputstream. This checks the classpath firs
writeGZip
This function writes a list of objects into a Gzipped file, one per line. Each object is transformed

Popular in Java

Running tasks concurrently on multiple threads
putExtra (Intent)
setScale (BigDecimal)
getOriginalFilename (MultipartFile)
Return the original filename in the client's filesystem. This may contain path information depending
SocketException (java.net)
This SocketException may be thrown during socket creation or setting options, and is the superclass
List (java.util)
An ordered collection (also known as a sequence). The user of this interface has precise control ove
Stack (java.util)
Stack is a Last-In/First-Out(LIFO) data structure which represents a stack of objects. It enables u
ConcurrentHashMap (java.util.concurrent)
A plug-in replacement for JDK1.5 java.util.concurrent.ConcurrentHashMap. This version is based on or
LogFactory (org.apache.commons.logging)
Factory for creating Log instances, with discovery and configuration features similar to that employ
Location (org.springframework.beans.factory.parsing)
Class that models an arbitrary location in a Resource. Typically used to track the location of proble
Best plugins for Eclipse

How to use the slurp method in edu.illinois.cs.cogcomp.core.io.LineIO

Best Java code snippets using edu.illinois.cs.cogcomp.core.io.LineIO.slurp (Showing top 20 results out of 315)

How to use
slurp
method
in
edu.illinois.cs.cogcomp.core.io.LineIO