it.unimi.dsi.io.SegmentedInputStream.addBlock java code examples

/** Creates a segmented stream over the given input stream and immediately adds one block to it.
 *
 * <p>This is a shorthand for invoking the single-argument constructor and then
 * {@code addBlock( delimiter )}.
 *
 * @param in the underlying input stream.
 * @param delimiter an array of segment delimiters defining the block to add.
 * @throws NullPointerException declared by this constructor; the triggering condition is not
 *         visible here (presumably a {@code null} argument; to be confirmed).
 * @throws IOException declared by this constructor; presumably propagated from {@code addBlock}
 *         when it positions the underlying stream (to be confirmed).
 * @throws IllegalStateException declared by this constructor; the triggering condition is not
 *         visible here.
 */
public SegmentedInputStream( final InputStream in, final long... delimiter ) throws NullPointerException, IOException, IllegalStateException {
  // Delegate the basic set-up to the single-argument constructor.
  this( in );
  // Register the block described by the delimiters.
  addBlock( delimiter );
}

/** Creates a segmented stream over the given input stream and immediately adds one block to it.
 *
 * <p>This is a shorthand for invoking the single-argument constructor and then
 * {@code addBlock(delimiter)}.
 *
 * @param in the underlying input stream.
 * @param delimiter an array of segment delimiters defining the block to add.
 * @throws NullPointerException declared by this constructor; the triggering condition is not
 *         visible here (presumably a {@code null} argument; to be confirmed).
 * @throws IOException declared by this constructor; presumably propagated from {@code addBlock}
 *         when it positions the underlying stream (to be confirmed).
 * @throws IllegalStateException declared by this constructor; the triggering condition is not
 *         visible here.
 */
public SegmentedInputStream(final InputStream in, final long... delimiter) throws NullPointerException, IOException, IllegalStateException {
  // Delegate the basic set-up to the single-argument constructor.
  this(in);
  // Register the block described by the delimiters.
  addBlock(delimiter);
}

/** Creates a segmented stream over the given input stream and immediately adds one block to it.
 *
 * <p>This is a shorthand for invoking the single-argument constructor and then
 * {@code addBlock( delimiter )}.
 *
 * @param in the underlying input stream.
 * @param delimiter an array of segment delimiters defining the block to add.
 * @throws NullPointerException declared by this constructor; the triggering condition is not
 *         visible here (presumably a {@code null} argument; to be confirmed).
 * @throws IOException declared by this constructor; presumably propagated from {@code addBlock}
 *         when it positions the underlying stream (to be confirmed).
 * @throws IllegalStateException declared by this constructor; the triggering condition is not
 *         visible here.
 */
public SegmentedInputStream( final InputStream in, final long... delimiter ) throws NullPointerException, IOException, IllegalStateException {
  // Delegate the basic set-up to the single-argument constructor.
  this( in );
  // Register the block described by the delimiters.
  addBlock( delimiter );
}

/**
 * Moves on to the next contents file: closes the current segmented stream, opens the file
 * referenced by the next descriptor and adds one block per descriptor of that file.
 *
 * <p>Descriptors of the same file are assumed to be contiguous in {@code descriptorIterator},
 * so they are consumed until a descriptor with a different file index is met. That descriptor
 * has already been taken from the iterator, so it is kept in {@code firstNextDescriptor} and
 * becomes the first descriptor handled by the following call.
 *
 * @return {@code true} if a file was opened and its blocks were added; {@code false} if
 *         {@code size()} is zero or no descriptor is left to process.
 * @throws FileNotFoundException declared by this method; presumably raised when the contents
 *         file cannot be opened (to be confirmed against {@code openFileStream}).
 * @throws IOException declared by this method; presumably raised while opening the file or
 *         adding blocks (to be confirmed).
 */
private boolean nextFile() throws FileNotFoundException, IOException {
  if ( size() == 0 ) return false;
  IOUtils.closeQuietly( siStream );
  /*
   * A descriptor kept aside by the previous call must still be processed even if the
   * iterator is exhausted, otherwise a last file holding a single document would be lost.
   */
  if ( firstNextDescriptor == null && ! descriptorIterator.hasNext() ) return false;
  /*
   * We assume documents contained in the same gzip file are
   * contiguous so we collect all of them until we find a different
   * file index.
   */
  TRECDocumentDescriptor currentDescriptor = firstNextDescriptor != null ? firstNextDescriptor : descriptorIterator.next();
  // The pending descriptor (if any) is being consumed now.
  firstNextDescriptor = null;
  final int currentFileIndex = currentDescriptor.fileIndex;
  if ( DEBUG ) LOGGER.debug( "Skipping to contents file " + currentFileIndex + " (" + file[ currentFileIndex ] + ")" );
  /*
   * We create the segmented input stream with all just collected
   * descriptors
   */
  siStream = new SegmentedInputStream( openFileStream( file[ currentFileIndex ] ) );
  for ( ;; ) {
    siStream.addBlock( currentDescriptor.toSegments() );
    if ( ! descriptorIterator.hasNext() ) break;
    currentDescriptor = descriptorIterator.next();
    if ( currentDescriptor.fileIndex != currentFileIndex ) {
      // First descriptor of the following file: keep it for the next call.
      firstNextDescriptor = currentDescriptor;
      break;
    }
  }
  return true;
}

/**
 * Moves on to the next contents file: closes the current segmented stream, opens the file
 * referenced by the next descriptor and adds one block per descriptor of that file.
 *
 * <p>Descriptors of the same file are assumed to be contiguous in {@code descriptorIterator},
 * so they are consumed until a descriptor with a different file index is met. That descriptor
 * has already been taken from the iterator, so it is kept in {@code firstNextDescriptor} and
 * becomes the first descriptor handled by the following call.
 *
 * @return {@code true} if a file was opened and its blocks were added; {@code false} if
 *         {@code size()} is zero or no descriptor is left to process.
 * @throws FileNotFoundException declared by this method; presumably raised when the contents
 *         file cannot be opened (to be confirmed against {@code openFileStream}).
 * @throws IOException declared by this method; presumably raised while opening the file or
 *         adding blocks (to be confirmed).
 */
private boolean nextFile() throws FileNotFoundException, IOException {
  if ( size() == 0 ) return false;
  IOUtils.closeQuietly( siStream );
  /*
   * A descriptor kept aside by the previous call must still be processed even if the
   * iterator is exhausted, otherwise a last file holding a single document would be lost.
   */
  if ( firstNextDescriptor == null && ! descriptorIterator.hasNext() ) return false;
  /*
   * We assume documents contained in the same gzip file are
   * contiguous so we collect all of them until we find a different
   * file index.
   */
  TRECDocumentDescriptor currentDescriptor = firstNextDescriptor != null ? firstNextDescriptor : descriptorIterator.next();
  // The pending descriptor (if any) is being consumed now.
  firstNextDescriptor = null;
  final int currentFileIndex = currentDescriptor.fileIndex;
  if ( DEBUG ) LOGGER.debug( "Skipping to contents file " + currentFileIndex + " (" + file[ currentFileIndex ] + ")" );
  /*
   * We create the segmented input stream with all just collected
   * descriptors
   */
  siStream = new SegmentedInputStream( openFileStream( file[ currentFileIndex ] ) );
  for ( ;; ) {
    siStream.addBlock( currentDescriptor.toSegments() );
    if ( ! descriptorIterator.hasNext() ) break;
    currentDescriptor = descriptorIterator.next();
    if ( currentDescriptor.fileIndex != currentFileIndex ) {
      // First descriptor of the following file: keep it for the next call.
      firstNextDescriptor = currentDescriptor;
      break;
    }
  }
  return true;
}

/**
 * Moves on to the next contents file: closes the current segmented stream, opens the file
 * referenced by the next descriptor and adds one block per descriptor of that file.
 *
 * <p>Descriptors of the same file are assumed to be contiguous in {@code descriptorIterator},
 * so they are consumed until a descriptor with a different file index is met. That descriptor
 * has already been taken from the iterator, so it is kept in {@code firstNextDescriptor} and
 * becomes the first descriptor handled by the following call.
 *
 * @return {@code true} if a file was opened and its blocks were added; {@code false} if
 *         {@code size()} is zero or no descriptor is left to process.
 * @throws FileNotFoundException declared by this method; presumably raised when the contents
 *         file cannot be opened (to be confirmed against {@code openFileStream}).
 * @throws IOException declared by this method; presumably raised while opening the file or
 *         adding blocks (to be confirmed).
 */
private boolean nextFile() throws FileNotFoundException, IOException {
  if ( size() == 0 ) return false;
  IOUtils.closeQuietly( siStream );
  /*
   * A descriptor kept aside by the previous call must still be processed even if the
   * iterator is exhausted, otherwise a last file holding a single document would be lost.
   */
  if ( firstNextDescriptor == null && ! descriptorIterator.hasNext() ) return false;
  /*
   * We assume documents contained in the same gzip file are
   * contiguous so we collect all of them until we find a different
   * file index.
   */
  TRECDocumentDescriptor currentDescriptor = firstNextDescriptor != null ? firstNextDescriptor : descriptorIterator.next();
  // The pending descriptor (if any) is being consumed now.
  firstNextDescriptor = null;
  final int currentFileIndex = currentDescriptor.fileIndex;
  if ( DEBUG ) LOGGER.debug( "Skipping to contents file " + currentFileIndex + " (" + file[ currentFileIndex ] + ")" );
  /*
   * We create the segmented input stream with all just collected
   * descriptors
   */
  siStream = new SegmentedInputStream( openFileStream( file[ currentFileIndex ] ) );
  for ( ;; ) {
    siStream.addBlock( currentDescriptor.toSegments() );
    if ( ! descriptorIterator.hasNext() ) break;
    currentDescriptor = descriptorIterator.next();
    if ( currentDescriptor.fileIndex != currentFileIndex ) {
      // First descriptor of the following file: keep it for the next call.
      firstNextDescriptor = currentDescriptor;
      break;
    }
  }
  return true;
}

/**
 * Moves on to the next contents file: closes the current segmented stream, opens the file
 * referenced by the next descriptor and adds one block per descriptor of that file.
 *
 * <p>Descriptors of the same file are assumed to be contiguous in {@code descriptorIterator},
 * so they are consumed until a descriptor with a different file index is met. That descriptor
 * has already been taken from the iterator, so it is kept in {@code firstNextDescriptor} and
 * becomes the first descriptor handled by the following call.
 *
 * @return {@code true} if a file was opened and its blocks were added; {@code false} if
 *         {@code size()} is zero or no descriptor is left to process.
 * @throws FileNotFoundException declared by this method; presumably raised when the contents
 *         file cannot be opened (to be confirmed against {@code openFileStream}).
 * @throws IOException declared by this method; presumably raised while opening the file or
 *         adding blocks (to be confirmed).
 */
private boolean nextFile() throws FileNotFoundException, IOException {
  if ( size() == 0 ) return false;
  IOUtils.closeQuietly( siStream );
  /*
   * A descriptor kept aside by the previous call must still be processed even if the
   * iterator is exhausted, otherwise a last file holding a single document would be lost.
   */
  if ( firstNextDescriptor == null && ! descriptorIterator.hasNext() ) return false;
  /*
   * We assume documents contained in the same gzip file are
   * contiguous so we collect all of them until we find a different
   * file index.
   */
  TRECDocumentDescriptor currentDescriptor = firstNextDescriptor != null ? firstNextDescriptor : descriptorIterator.next();
  // The pending descriptor (if any) is being consumed now.
  firstNextDescriptor = null;
  final int currentFileIndex = currentDescriptor.fileIndex;
  if ( DEBUG ) LOGGER.debug( "Skipping to contents file " + currentFileIndex + " (" + file[ currentFileIndex ] + ")" );
  /*
   * We create the segmented input stream with all just collected
   * descriptors
   */
  siStream = new SegmentedInputStream( openFileStream( file[ currentFileIndex ] ) );
  for ( ;; ) {
    siStream.addBlock( currentDescriptor.toSegments() );
    if ( ! descriptorIterator.hasNext() ) break;
    currentDescriptor = descriptorIterator.next();
    if ( currentDescriptor.fileIndex != currentFileIndex ) {
      // First descriptor of the following file: keep it for the next call.
      firstNextDescriptor = currentDescriptor;
      break;
    }
  }
  return true;
}

Javadoc

Adds a new block defined by its array of segment delimiters.

The block has length defined by the difference between the last and first delimiter.

This method performs the initial call to #nextBlock() when the first marker is put in.

Popular methods of SegmentedInputStream

hasMoreBlocks
Checks whether there are more blocks.
nextBlock
Skips to the first segment of the next block, if any. In such case, it returns true, or false otherwise.
<init>
Creates a stream with one marker in.
close
Skips to the next block, closing this segmented input stream if there are no more blocks.
ensureBlocksNotEmpty
ensureNotClosed
eofInBlock
Checks if the current position is a stop marker.
nextSegment
Skips the underlying input stream to the next segment.

Popular in Java

Running tasks concurrently on multiple threads
onCreateOptionsMenu (Activity)
getResourceAsStream (ClassLoader)
runOnUiThread (Activity)
EOFException (java.io)
Thrown when a program encounters the end of a file or stream during an input operation.
Timestamp (java.sql)
A Java representation of the SQL TIMESTAMP type. It provides the capability of representing the SQL
DecimalFormat (java.text)
A concrete subclass of NumberFormat that formats decimal numbers. It has a variety of features desig
ZipFile (java.util.zip)
This class provides random read access to a zip file. You pay more to read the zip file's central di
IsNull (org.hamcrest.core)
Is the value null?
Location (org.springframework.beans.factory.parsing)
Class that models an arbitrary location in a Resource. Typically used to track the location of proble
Top Sublime Text plugins

How to use the addBlock method in it.unimi.dsi.io.SegmentedInputStream

Best Java code snippets using it.unimi.dsi.io.SegmentedInputStream.addBlock (Showing top 7 results out of 315)

How to use
addBlock
method
in
it.unimi.dsi.io.SegmentedInputStream