/**
 * Creates an input format by delegating to the constructor that accepts a
 * {@code ParquetInputFormat<ArrayWritable>}, passing a new instance that is
 * constructed with {@code DataWritableReadSupport.class} as its read support.
 */
public MapredParquetInputFormat() {
  this(
      new ParquetInputFormat<ArrayWritable>(
          DataWritableReadSupport.class));
}
/**
 * Builds a {@code FileSplit} for {@code file} (defined outside this method) from the
 * first split that a {@code ParquetInputFormat} reports for the given job.
 *
 * <p>The returned split always starts at offset {@code 0}; its length and host
 * locations are copied from the first reported split.
 *
 * @param vectorJob the job passed to {@code ParquetInputFormat.getSplits}
 * @return a file split covering {@code file} from offset 0 for the first split's length
 * @throws IOException if computing the splits fails, or if no split is reported
 * @throws InterruptedException if reading the split's length or locations is interrupted
 */
protected static FileSplit getFileSplit(Job vectorJob) throws IOException, InterruptedException {
  // Parameterized (wildcard + diamond) instead of a raw type, so getSplits(...) yields a
  // typed list and no unchecked cast is required.
  ParquetInputFormat<?> parquetInputFormat = new ParquetInputFormat<>(GroupReadSupport.class);
  // Fully qualified so this method does not depend on an extra import in the file.
  java.util.List<InputSplit> splits = parquetInputFormat.getSplits(vectorJob);

  // Fail with a descriptive error instead of an IndexOutOfBoundsException from get(0).
  if (splits == null || splits.isEmpty()) {
    throw new IOException("No input splits found for " + file);
  }

  InputSplit split = splits.get(0);
  return new FileSplit(file, 0L, split.getLength(), split.getLocations());
}
/**
 * Sets up this input format.
 *
 * <p>Logs an informational message, then hands a block to {@code inClassloader} that:
 * <ol>
 *   <li>creates {@code job} from a fresh {@code ConfigurationProxy};</li>
 *   <li>instantiates {@code nativeParquetInputFormat};</li>
 *   <li>registers {@code PentahoParquetReadSupport} as the read support class on the job;</li>
 *   <li>sets task-side metadata to {@code false} on the job.</li>
 * </ol>
 *
 * <p>NOTE(review): {@code inClassloader} is defined elsewhere; presumably it runs the
 * block under a specific classloader -- confirm against its definition.
 *
 * @throws Exception as declared by the original signature; the visible code does not
 *     narrow the type
 */
public PentahoParquetInputFormat() throws Exception {
  logger.info( "We are initializing parquet input format" );

  inClassloader( () -> {
    // Job is built first, directly from a new configuration proxy.
    job = Job.getInstance( new ConfigurationProxy() );

    nativeParquetInputFormat = new ParquetInputFormat<>();

    // Static Parquet settings are applied to the job that was just created.
    ParquetInputFormat.setReadSupportClass( job, PentahoParquetReadSupport.class );
    ParquetInputFormat.setTaskSideMetaData( job, false );
  } );
}