org.apache.hadoop.hive.serde2.avro.AvroDeserializer.worker Java code examples

/**
 * Converts an Avro map datum into a {@code Map<String, Object>}.
 *
 * <p>Each key is turned into a {@code String} via {@code toString()} and each value is
 * passed through {@code worker} together with the value schemas and value type info.
 *
 * @param datum the map value; cast to a map keyed by {@code CharSequence}
 * @param fileSchema schema whose value type is forwarded to {@code worker}; may be {@code null},
 *     in which case {@code null} is forwarded
 * @param mapSchema schema supplying the value schema handed to {@code worker}
 * @param columnType type info supplying the map value type info
 * @return a new {@code HashMap} holding one converted entry per entry of {@code datum}
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeMap(Object datum, Schema fileSchema, Schema mapSchema, MapTypeInfo columnType)
    throws AvroSerdeException {
 // Avro map keys are always strings, so only the values need real deserialization.
 @SuppressWarnings("unchecked")
 Map<CharSequence, Object> source = (Map<CharSequence, Object>) datum;
 Schema readerValueSchema = mapSchema.getValueType();
 TypeInfo elementTypeInfo = columnType.getMapValueTypeInfo();
 Map<String, Object> converted = new HashMap<String, Object>();
 for (Map.Entry<CharSequence, Object> entry : source.entrySet()) {
  Object rawValue = entry.getValue();
  String name = entry.getKey().toString();
  // The file schema is optional; only ask it for a value type when it is present.
  Schema fileValueSchema = null;
  if (fileSchema != null) {
   fileValueSchema = fileSchema.getValueType();
  }
  converted.put(name, worker(rawValue, fileValueSchema, readerValueSchema, elementTypeInfo));
 }
 return converted;
}

/**
 * Deserializes every listed column of {@code record} and appends the results to
 * {@code objectRow}, in column order.
 *
 * @param objectRow list that receives one deserialized value per column; also the return value
 * @param fileSchema schema used to look up each column's file-side field
 * @param columnNames names of the columns to read from {@code record}
 * @param columnTypes type info for each column, indexed in parallel with {@code columnNames}
 * @param record the record whose fields are read by name
 * @return {@code objectRow}, after the column values have been appended
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private List<Object> workerBase(List<Object> objectRow, Schema fileSchema, List<String> columnNames,
                List<TypeInfo> columnTypes, GenericRecord record)
    throws AvroSerdeException {
 for (int col = 0; col < columnNames.size(); col++) {
  TypeInfo typeInfo = columnTypes.get(col);
  String name = columnNames.get(col);
  Object rawValue = record.get(name);
  Schema readerFieldSchema = record.getSchema().getField(name).schema();

  // If AvroSerdeUtils reports the file schema as a nullable type, the field is looked up
  // on the type returned by getOtherTypeFromNullableType instead of on fileSchema itself.
  Schema fieldOwner = fileSchema;
  if (AvroSerdeUtils.isNullableType(fileSchema)) {
   fieldOwner = AvroSerdeUtils.getOtherTypeFromNullableType(fileSchema);
  }
  Schema.Field fileField = fieldOwner.getField(name);

  // A column absent from the file-side schema is passed to worker with a null file schema.
  Schema fileFieldSchema = null;
  if (fileField != null) {
   fileFieldSchema = fileField.schema();
  }
  objectRow.add(worker(rawValue, fileFieldSchema, readerFieldSchema, typeInfo));
 }
 return objectRow;
}

/**
 * Deserializes a union datum: resolves which union branch the datum belongs to, hands the
 * datum to {@code worker} with the matching branch schemas, and wraps the result in a
 * {@code StandardUnion} tagged with the record-schema branch index.
 *
 * <p>The branch index is resolved separately against the file schema and the record schema,
 * since the schema can evolve and the two unions can have different tags. The file-schema
 * index is only resolved when {@code fileSchema} is non-null; previously it was resolved
 * unconditionally even though the following statement treats a null file schema as valid.
 *
 * @param datum the union value to deserialize
 * @param fileSchema union schema on the file side; may be {@code null}, in which case
 *     {@code null} is forwarded to {@code worker}
 * @param recordSchema union schema on the record side; its branch index becomes the union tag
 * @param columnType union type info supplying the per-branch type infos
 * @return a {@code StandardUnion} holding the record-schema tag and the deserialized value
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeUnion(Object datum, Schema fileSchema, Schema recordSchema,
                UnionTypeInfo columnType) throws AvroSerdeException {
 // Resolve the file-side branch only when a file schema exists; resolving against a null
 // union schema would fail before the null check below ever ran.
 Schema fileBranchSchema = null;
 if (fileSchema != null) {
  int fsTag = GenericData.get().resolveUnion(fileSchema, datum); // index of value in fileSchema
  fileBranchSchema = fileSchema.getTypes().get(fsTag);
 }
 int rsTag = GenericData.get().resolveUnion(recordSchema, datum); // index of value in recordSchema
 Object desered = worker(datum, fileBranchSchema,
   recordSchema.getTypes().get(rsTag), columnType.getAllUnionObjectTypeInfos().get(rsTag));
 return new StandardUnionObjectInspector.StandardUnion((byte)rsTag, desered);
}

List<Object> listContents = new ArrayList<Object>(listData.size());
for(Object obj : listData) {
 listContents.add(worker(obj, fileSchema == null ? null : fileSchema.getElementType(), listSchema,
   columnType.getListElementTypeInfo()));

/**
 * Deserializes every listed column of {@code record} and appends the results to
 * {@code objectRow}, in column order.
 *
 * @param objectRow list that receives one deserialized value per column; also the return value
 * @param columnNames names of the columns to read from {@code record}
 * @param columnTypes type info for each column, indexed in parallel with {@code columnNames}
 * @param record the record whose fields (and field schemas) are read by name
 * @return {@code objectRow}, after the column values have been appended
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private List<Object> workerBase(List<Object> objectRow, List<String> columnNames,
                List<TypeInfo> columnTypes, GenericRecord record)
    throws AvroSerdeException {
 for (int col = 0; col < columnNames.size(); col++) {
  TypeInfo typeInfo = columnTypes.get(col);
  String name = columnNames.get(col);
  Object rawValue = record.get(name);
  // The schema for the value comes from the record's own schema, looked up by field name.
  Schema fieldSchema = record.getSchema().getField(name).schema();
  Object converted = worker(rawValue, fieldSchema, typeInfo);
  objectRow.add(converted);
 }
 return objectRow;
}

/**
 * Deserializes a union datum: resolves the datum's branch index against
 * {@code recordSchema}, hands the datum to {@code worker} with the branch schemas at that
 * index, and wraps the result in a {@code StandardUnion} tagged with the index.
 *
 * <p>NOTE(review): the same index is used to pick the branch of {@code fileSchema}; this
 * assumes both unions list their branches in the same order — confirm against callers.
 *
 * @param datum the union value to deserialize
 * @param fileSchema union schema on the file side; may be {@code null}, in which case
 *     {@code null} is forwarded to {@code worker}
 * @param recordSchema union schema used to resolve the branch index
 * @param columnType union type info supplying the per-branch type infos
 * @return a {@code StandardUnion} holding the branch index and the deserialized value
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeUnion(Object datum, Schema fileSchema, Schema recordSchema,
                UnionTypeInfo columnType) throws AvroSerdeException {
 int branchIndex = GenericData.get().resolveUnion(recordSchema, datum);

 Schema fileBranch = null;
 if (fileSchema != null) {
  fileBranch = fileSchema.getTypes().get(branchIndex);
 }
 Schema recordBranch = recordSchema.getTypes().get(branchIndex);

 Object branchValue = worker(datum, fileBranch, recordBranch,
   columnType.getAllUnionObjectTypeInfos().get(branchIndex));
 return new StandardUnionObjectInspector.StandardUnion((byte) branchIndex, branchValue);
}

/**
 * Converts an Avro map datum into a {@code Map<String, Object>}.
 *
 * <p>Each key is turned into a {@code String} via {@code toString()} and each value is
 * passed through {@code worker} together with the value schemas and value type info.
 *
 * @param datum the map value; cast to a map keyed by {@code CharSequence}
 * @param fileSchema schema whose value type is forwarded to {@code worker}; may be {@code null},
 *     in which case {@code null} is forwarded
 * @param mapSchema schema supplying the value schema handed to {@code worker}
 * @param columnType type info supplying the map value type info
 * @return a new {@code HashMap} holding one converted entry per entry of {@code datum}
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeMap(Object datum, Schema fileSchema, Schema mapSchema, MapTypeInfo columnType)
    throws AvroSerdeException {
 // Avro map keys are always strings, so only the values need real deserialization.
 @SuppressWarnings("unchecked")
 Map<CharSequence, Object> source = (Map<CharSequence, Object>) datum;
 Schema readerValueSchema = mapSchema.getValueType();
 TypeInfo elementTypeInfo = columnType.getMapValueTypeInfo();
 Map<String, Object> converted = new HashMap<String, Object>();
 for (Map.Entry<CharSequence, Object> entry : source.entrySet()) {
  Object rawValue = entry.getValue();
  String name = entry.getKey().toString();
  // The file schema is optional; only ask it for a value type when it is present.
  Schema fileValueSchema = null;
  if (fileSchema != null) {
   fileValueSchema = fileSchema.getValueType();
  }
  converted.put(name, worker(rawValue, fileValueSchema, readerValueSchema, elementTypeInfo));
 }
 return converted;
}

/**
 * Builds a {@code String}-keyed copy of an Avro map datum with every value deserialized.
 *
 * @param datum the map value; cast to a map keyed by {@code CharSequence}
 * @param fileSchema optional schema; when non-null its value type is forwarded to
 *     {@code worker}, otherwise {@code null} is forwarded
 * @param mapSchema schema whose value type is handed to {@code worker}
 * @param columnType type info whose map value type info is handed to {@code worker}
 * @return a new {@code HashMap} with stringified keys and the values returned by {@code worker}
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeMap(Object datum, Schema fileSchema, Schema mapSchema, MapTypeInfo columnType)
    throws AvroSerdeException {
 // Keys only need toString(); Avro restricts map keys to strings.
 @SuppressWarnings("unchecked")
 Map<CharSequence, Object> input = (Map<CharSequence, Object>) datum;
 Schema valueSchema = mapSchema.getValueType();
 TypeInfo valueTypeInfo = columnType.getMapValueTypeInfo();
 Map<String, Object> result = new HashMap<String, Object>();
 for (Map.Entry<CharSequence, Object> pair : input.entrySet()) {
  Object original = pair.getValue();
  String keyText = pair.getKey().toString();
  Schema fileValueSchema = null;
  if (fileSchema != null) {
   fileValueSchema = fileSchema.getValueType();
  }
  Object deserialized = worker(original, fileValueSchema, valueSchema, valueTypeInfo);
  result.put(keyText, deserialized);
 }
 return result;
}

/**
 * Deserializes a union datum: resolves the datum's branch index against
 * {@code recordSchema}, hands the datum to {@code worker} with the branch schemas at that
 * index, and wraps the result in a {@code StandardUnion} tagged with the index.
 *
 * <p>NOTE(review): the same index is used to pick the branch of {@code fileSchema}; this
 * assumes both unions list their branches in the same order — confirm against callers.
 *
 * @param datum the union value to deserialize
 * @param fileSchema union schema on the file side; may be {@code null}, in which case
 *     {@code null} is forwarded to {@code worker}
 * @param recordSchema union schema used to resolve the branch index
 * @param columnType union type info supplying the per-branch type infos
 * @return a {@code StandardUnion} holding the branch index and the deserialized value
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeUnion(Object datum, Schema fileSchema, Schema recordSchema,
                UnionTypeInfo columnType) throws AvroSerdeException {
 int branchIndex = GenericData.get().resolveUnion(recordSchema, datum);

 Schema fileBranch = null;
 if (fileSchema != null) {
  fileBranch = fileSchema.getTypes().get(branchIndex);
 }
 Schema recordBranch = recordSchema.getTypes().get(branchIndex);

 Object branchValue = worker(datum, fileBranch, recordBranch,
   columnType.getAllUnionObjectTypeInfos().get(branchIndex));
 return new StandardUnionObjectInspector.StandardUnion((byte) branchIndex, branchValue);
}

/**
 * Picks the union branch that {@code datum} resolves to in {@code recordSchema}, runs the
 * datum through {@code worker} for that branch, and returns it wrapped in a
 * {@code StandardUnion} carrying the branch index as its tag.
 *
 * <p>NOTE(review): {@code fileSchema} is indexed with the record-schema branch index;
 * presumably both unions are expected to share branch order — verify.
 *
 * @param datum the union value to deserialize
 * @param fileSchema optional file-side union schema; {@code null} is forwarded as {@code null}
 * @param recordSchema union schema used to resolve the branch index
 * @param columnType union type info supplying the per-branch type infos
 * @return a {@code StandardUnion} holding the branch index and the deserialized value
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeUnion(Object datum, Schema fileSchema, Schema recordSchema,
                UnionTypeInfo columnType) throws AvroSerdeException {
 int selected = GenericData.get().resolveUnion(recordSchema, datum);

 Schema fileSide;
 if (fileSchema == null) {
  fileSide = null;
 } else {
  fileSide = fileSchema.getTypes().get(selected);
 }
 Schema recordSide = recordSchema.getTypes().get(selected);

 Object value = worker(datum, fileSide, recordSide,
   columnType.getAllUnionObjectTypeInfos().get(selected));
 return new StandardUnionObjectInspector.StandardUnion((byte) selected, value);
}

/**
 * Converts an Avro map datum into a {@code Map<String, Object>}.
 *
 * <p>Each key is turned into a {@code String} via {@code toString()} and each value is
 * passed through {@code worker} together with the value schemas and value type info.
 *
 * @param datum the map value; cast to a map keyed by {@code CharSequence}
 * @param fileSchema schema whose value type is forwarded to {@code worker}; may be {@code null},
 *     in which case {@code null} is forwarded
 * @param mapSchema schema supplying the value schema handed to {@code worker}
 * @param columnType type info supplying the map value type info
 * @return a new {@code HashMap} holding one converted entry per entry of {@code datum}
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeMap(Object datum, Schema fileSchema, Schema mapSchema, MapTypeInfo columnType)
    throws AvroSerdeException {
 // Avro map keys are always strings, so only the values need real deserialization.
 @SuppressWarnings("unchecked")
 Map<CharSequence, Object> source = (Map<CharSequence, Object>) datum;
 Schema readerValueSchema = mapSchema.getValueType();
 TypeInfo elementTypeInfo = columnType.getMapValueTypeInfo();
 Map<String, Object> converted = new HashMap<String, Object>();
 for (Map.Entry<CharSequence, Object> entry : source.entrySet()) {
  Object rawValue = entry.getValue();
  String name = entry.getKey().toString();
  // The file schema is optional; only ask it for a value type when it is present.
  Schema fileValueSchema = null;
  if (fileSchema != null) {
   fileValueSchema = fileSchema.getValueType();
  }
  converted.put(name, worker(rawValue, fileValueSchema, readerValueSchema, elementTypeInfo));
 }
 return converted;
}

/**
 * Builds a {@code String}-keyed copy of an Avro map datum with every value deserialized.
 *
 * @param datum the map value; cast to a map keyed by {@code CharSequence}
 * @param fileSchema optional schema; when non-null its value type is forwarded to
 *     {@code worker}, otherwise {@code null} is forwarded
 * @param mapSchema schema whose value type is handed to {@code worker}
 * @param columnType type info whose map value type info is handed to {@code worker}
 * @return a new {@code HashMap} with stringified keys and the values returned by {@code worker}
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeMap(Object datum, Schema fileSchema, Schema mapSchema, MapTypeInfo columnType)
    throws AvroSerdeException {
 // Keys only need toString(); Avro restricts map keys to strings.
 @SuppressWarnings("unchecked")
 Map<CharSequence, Object> input = (Map<CharSequence, Object>) datum;
 Schema valueSchema = mapSchema.getValueType();
 TypeInfo valueTypeInfo = columnType.getMapValueTypeInfo();
 Map<String, Object> result = new HashMap<String, Object>();
 for (Map.Entry<CharSequence, Object> pair : input.entrySet()) {
  Object original = pair.getValue();
  String keyText = pair.getKey().toString();
  Schema fileValueSchema = null;
  if (fileSchema != null) {
   fileValueSchema = fileSchema.getValueType();
  }
  Object deserialized = worker(original, fileValueSchema, valueSchema, valueTypeInfo);
  result.put(keyText, deserialized);
 }
 return result;
}

 /**
  * Converts an Avro map datum into a {@code Map<String, Object>}.
  *
  * <p>Each key is turned into a {@code String} via {@code toString()} and each value is
  * passed through {@code worker} with the map's value schema and value type info.
  *
  * <p>The result is a {@code HashMap} rather than a {@code Hashtable}: {@code Hashtable}
  * rejects null values with a {@code NullPointerException}, and {@code worker} can
  * presumably yield {@code null} for nullable map values. Keys are read as
  * {@code CharSequence} so the cast does not depend on one concrete key class.
  *
  * @param datum the map value; cast to a map keyed by {@code CharSequence}
  * @param mapSchema schema supplying the value schema handed to {@code worker}
  * @param columnType type info supplying the map value type info
  * @return a new map holding one converted entry per entry of {@code datum}
  * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
  */
 private Object deserializeMap(Object datum, Schema mapSchema, MapTypeInfo columnType)
     throws AvroSerdeException {
  // Avro only allows maps with Strings for keys, so we only have to worry
  // about deserializing the values
  Map<String, Object> map = new java.util.HashMap<String, Object>();
  @SuppressWarnings("unchecked")
  Map<CharSequence, Object> mapDatum = (Map<CharSequence, Object>) datum;
  Schema valueSchema = mapSchema.getValueType();
  TypeInfo valueTypeInfo = columnType.getMapValueTypeInfo();
  // Iterate entries directly instead of looking each key up again.
  for (Map.Entry<CharSequence, Object> entry : mapDatum.entrySet()) {
   Object value = entry.getValue();
   map.put(entry.getKey().toString(), worker(value, valueSchema, valueTypeInfo));
  }

  return map;
 }
}

/**
 * Deserializes every listed column of {@code record} and appends the results to
 * {@code objectRow}, in column order.
 *
 * @param objectRow list that receives one deserialized value per column; also the return value
 * @param fileSchema schema used to look up each column's file-side field
 * @param columnNames names of the columns to read from {@code record}
 * @param columnTypes type info for each column, indexed in parallel with {@code columnNames}
 * @param record the record whose fields are read by name
 * @return {@code objectRow}, after the column values have been appended
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private List<Object> workerBase(List<Object> objectRow, Schema fileSchema, List<String> columnNames,
                List<TypeInfo> columnTypes, GenericRecord record)
    throws AvroSerdeException {
 for (int col = 0; col < columnNames.size(); col++) {
  TypeInfo typeInfo = columnTypes.get(col);
  String name = columnNames.get(col);
  Object rawValue = record.get(name);
  Schema readerFieldSchema = record.getSchema().getField(name).schema();

  // If AvroSerdeUtils reports the file schema as a nullable type, the field is looked up
  // on the type returned by getOtherTypeFromNullableType instead of on fileSchema itself.
  Schema fieldOwner = fileSchema;
  if (AvroSerdeUtils.isNullableType(fileSchema)) {
   fieldOwner = AvroSerdeUtils.getOtherTypeFromNullableType(fileSchema);
  }
  Schema.Field fileField = fieldOwner.getField(name);

  // A column absent from the file-side schema is passed to worker with a null file schema.
  Schema fileFieldSchema = null;
  if (fileField != null) {
   fileFieldSchema = fileField.schema();
  }
  objectRow.add(worker(rawValue, fileFieldSchema, readerFieldSchema, typeInfo));
 }
 return objectRow;
}

/**
 * Walks the column list, deserializes the matching field of {@code record} for each
 * column, and appends each result to {@code objectRow}.
 *
 * @param objectRow destination list; returned after all columns are appended
 * @param fileSchema schema consulted for the file-side definition of each column
 * @param columnNames column names, used as field names on {@code record} and the file schema
 * @param columnTypes per-column type info, parallel to {@code columnNames}
 * @param record source of the column values and their schemas
 * @return the same {@code objectRow} instance that was passed in
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private List<Object> workerBase(List<Object> objectRow, Schema fileSchema, List<String> columnNames,
                List<TypeInfo> columnTypes, GenericRecord record)
    throws AvroSerdeException {
 for (int idx = 0; idx < columnNames.size(); idx++) {
  TypeInfo type = columnTypes.get(idx);
  String column = columnNames.get(idx);
  Object value = record.get(column);
  Schema valueSchema = record.getSchema().getField(column).schema();

  // Choose which schema to search for the file-side field: the type that AvroSerdeUtils
  // extracts from a nullable type, or fileSchema itself when it is not nullable.
  Schema.Field fileField;
  if (AvroSerdeUtils.isNullableType(fileSchema)) {
   fileField = AvroSerdeUtils.getOtherTypeFromNullableType(fileSchema).getField(column);
  } else {
   fileField = fileSchema.getField(column);
  }

  // No file-side field means worker receives null for the file schema.
  Schema fileFieldSchema = (fileField != null) ? fileField.schema() : null;
  objectRow.add(worker(value, fileFieldSchema, valueSchema, type));
 }
 return objectRow;
}

/**
 * Deserializes a union datum: resolves which union branch the datum belongs to, hands the
 * datum to {@code worker} with the matching branch schemas, and wraps the result in a
 * {@code StandardUnion} tagged with the record-schema branch index.
 *
 * <p>The branch index is resolved separately against the file schema and the record schema,
 * since the schema can evolve and the two unions can have different tags. The file-schema
 * index is only resolved when {@code fileSchema} is non-null; previously it was resolved
 * unconditionally even though the following statement treats a null file schema as valid.
 *
 * @param datum the union value to deserialize
 * @param fileSchema union schema on the file side; may be {@code null}, in which case
 *     {@code null} is forwarded to {@code worker}
 * @param recordSchema union schema on the record side; its branch index becomes the union tag
 * @param columnType union type info supplying the per-branch type infos
 * @return a {@code StandardUnion} holding the record-schema tag and the deserialized value
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeUnion(Object datum, Schema fileSchema, Schema recordSchema,
                UnionTypeInfo columnType) throws AvroSerdeException {
 // Resolve the file-side branch only when a file schema exists; resolving against a null
 // union schema would fail before the null check below ever ran.
 Schema fileBranchSchema = null;
 if (fileSchema != null) {
  int fsTag = GenericData.get().resolveUnion(fileSchema, datum); // index of value in fileSchema
  fileBranchSchema = fileSchema.getTypes().get(fsTag);
 }
 int rsTag = GenericData.get().resolveUnion(recordSchema, datum); // index of value in recordSchema
 Object desered = worker(datum, fileBranchSchema,
   recordSchema.getTypes().get(rsTag), columnType.getAllUnionObjectTypeInfos().get(rsTag));
 return new StandardUnionObjectInspector.StandardUnion((byte)rsTag, desered);
}

/**
 * Deserializes every listed column of {@code record} and appends the results to
 * {@code objectRow}, in column order.
 *
 * @param objectRow list that receives one deserialized value per column; also the return value
 * @param fileSchema schema used to look up each column's file-side field
 * @param columnNames names of the columns to read from {@code record}
 * @param columnTypes type info for each column, indexed in parallel with {@code columnNames}
 * @param record the record whose fields are read by name
 * @return {@code objectRow}, after the column values have been appended
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private List<Object> workerBase(List<Object> objectRow, Schema fileSchema, List<String> columnNames,
                List<TypeInfo> columnTypes, GenericRecord record)
    throws AvroSerdeException {
 for (int col = 0; col < columnNames.size(); col++) {
  TypeInfo typeInfo = columnTypes.get(col);
  String name = columnNames.get(col);
  Object rawValue = record.get(name);
  Schema readerFieldSchema = record.getSchema().getField(name).schema();

  // If AvroSerdeUtils reports the file schema as a nullable type, the field is looked up
  // on the type returned by getOtherTypeFromNullableType instead of on fileSchema itself.
  Schema fieldOwner = fileSchema;
  if (AvroSerdeUtils.isNullableType(fileSchema)) {
   fieldOwner = AvroSerdeUtils.getOtherTypeFromNullableType(fileSchema);
  }
  Schema.Field fileField = fieldOwner.getField(name);

  // A column absent from the file-side schema is passed to worker with a null file schema.
  Schema fileFieldSchema = null;
  if (fileField != null) {
   fileFieldSchema = fileField.schema();
  }
  objectRow.add(worker(rawValue, fileFieldSchema, readerFieldSchema, typeInfo));
 }
 return objectRow;
}

/**
 * Resolves a nullable union to either {@code null} or the deserialized value of the
 * branch the datum belongs to.
 *
 * <p>The TypeInfo for the selected branch is regenerated from the branch schema on every
 * call, which is wasteful; the {@code columnType} argument is not consulted.
 *
 * @param datum the union value to deserialize
 * @param recordSchema union schema used to resolve the datum's branch
 * @param columnType unused by this method
 * @return {@code null} when the resolved branch has type {@code NULL}, otherwise the
 *     result of {@code worker} for that branch
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeNullableUnion(Object datum, Schema recordSchema,
                    TypeInfo columnType) throws AvroSerdeException {
 int branchIndex = GenericData.get().resolveUnion(recordSchema, datum);
 Schema branch = recordSchema.getTypes().get(branchIndex);
 boolean isNullBranch = branch.getType().equals(Schema.Type.NULL);
 if (isNullBranch) {
  return null;
 }
 TypeInfo branchTypeInfo = SchemaToTypeInfo.generateTypeInfo(branch);
 return worker(datum, branch, branchTypeInfo);
}

/**
 * Deserializes a union datum: resolves the datum's branch index against
 * {@code recordSchema}, runs the datum through {@code worker} with that branch's schema
 * and type info, and wraps the result in a {@code StandardUnion} tagged with the index.
 *
 * @param datum the union value to deserialize
 * @param recordSchema union schema used to resolve the branch index
 * @param columnType union type info supplying the per-branch type infos
 * @return a {@code StandardUnion} holding the branch index and the deserialized value
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private Object deserializeUnion(Object datum, Schema recordSchema,
                UnionTypeInfo columnType) throws AvroSerdeException {
 int branchIndex = GenericData.get().resolveUnion(recordSchema, datum);
 Schema branchSchema = recordSchema.getTypes().get(branchIndex);
 Object branchValue = worker(datum, branchSchema,
     columnType.getAllUnionObjectTypeInfos().get(branchIndex));
 return new StandardUnionObjectInspector.StandardUnion((byte) branchIndex, branchValue);
}

/**
 * Walks the column list, deserializes the matching field of {@code record} for each
 * column, and appends each result to {@code objectRow}.
 *
 * @param objectRow destination list; returned after all columns are appended
 * @param fileSchema schema consulted for the file-side definition of each column
 * @param columnNames column names, used as field names on {@code record} and the file schema
 * @param columnTypes per-column type info, parallel to {@code columnNames}
 * @param record source of the column values and their schemas
 * @return the same {@code objectRow} instance that was passed in
 * @throws AvroSerdeException declared here; presumably raised by {@code worker} (not visible)
 */
private List<Object> workerBase(List<Object> objectRow, Schema fileSchema, List<String> columnNames,
                List<TypeInfo> columnTypes, GenericRecord record)
    throws AvroSerdeException {
 for (int idx = 0; idx < columnNames.size(); idx++) {
  TypeInfo type = columnTypes.get(idx);
  String column = columnNames.get(idx);
  Object value = record.get(column);
  Schema valueSchema = record.getSchema().getField(column).schema();

  // Choose which schema to search for the file-side field: the type that AvroSerdeUtils
  // extracts from a nullable type, or fileSchema itself when it is not nullable.
  Schema.Field fileField;
  if (AvroSerdeUtils.isNullableType(fileSchema)) {
   fileField = AvroSerdeUtils.getOtherTypeFromNullableType(fileSchema).getField(column);
  } else {
   fileField = fileSchema.getField(column);
  }

  // No file-side field means worker receives null for the file schema.
  Schema fileFieldSchema = (fileField != null) ? fileField.schema() : null;
  objectRow.add(worker(value, fileFieldSchema, valueSchema, type));
 }
 return objectRow;
}

Popular methods of AvroDeserializer

<init>
deserialize
Deserialize an Avro record, recursing into its component fields and deserializing them as well. Fiel
deserializeList
deserializeMap
deserializeStruct
deserializeUnion
workerBase
deserializeNullableUnion
Extract either a null or the correct type from a Nullable type. This is horrible in that we rebuild the TypeInfo every time.
deserializePrimitive

Popular in Java

Reading from database using SQL prepared statement
notifyDataSetChanged (ArrayAdapter)
putExtra (Intent)
getSharedPreferences (Context)
URLConnection (java.net)
A connection to a URL for reading or writing. For HTTP connections, see HttpURLConnection for docume
Selector (java.nio.channels)
A controller for the selection of SelectableChannel objects. Selectable channels can be registered w
Path (java.nio.file)
MessageDigest (java.security)
Uses a one-way hash function to turn an arbitrary number of bytes into a fixed-length byte sequence.
Hashtable (java.util)
A plug-in replacement for JDK1.5 java.util.Hashtable. This version is based on org.cliffc.high_scale
Executors (java.util.concurrent)
Factory and utility methods for Executor, ExecutorService, ScheduledExecutorService, ThreadFactory,
From CI to AI: The AI layer in your organization

How to use the worker method in org.apache.hadoop.hive.serde2.avro.AvroDeserializer

Best Java code snippets using org.apache.hadoop.hive.serde2.avro.AvroDeserializer.worker (Showing top 20 results out of 315)

How to use
worker
method
in
org.apache.hadoop.hive.serde2.avro.AvroDeserializer