/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.hadoop.hive.hbase;

import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;

import org.apache.hadoop.hbase.client.Result;
import org.apache.hadoop.hive.hbase.ColumnMappings.ColumnMapping;
import org.apache.hadoop.hive.hbase.struct.HBaseValueFactory;
import org.apache.hadoop.hive.serde2.SerDeException;
import org.apache.hadoop.hive.serde2.lazy.ByteArrayRef;
import org.apache.hadoop.hive.serde2.lazy.LazyFactory;
import org.apache.hadoop.hive.serde2.lazy.LazyLong;
import org.apache.hadoop.hive.serde2.lazy.LazyObjectBase;
import org.apache.hadoop.hive.serde2.lazy.LazyStruct;
import org.apache.hadoop.hive.serde2.lazy.LazyTimestamp;
import org.apache.hadoop.hive.serde2.lazy.objectinspector.LazySimpleStructObjectInspector;
import org.apache.hadoop.hive.serde2.objectinspector.StructField;

import com.google.common.annotations.VisibleForTesting;

/**
 * LazyObject for storing an HBase row.  The field of an HBase row can be
 * primitive or non-primitive.
 */
public class LazyHBaseRow extends LazyStruct {

  /** The HBase row data most recently supplied through {@link #init(Result)}. */
  private Result result;

  /** List instance reused by {@link #getFieldsAsList()} across calls. */
  private ArrayList<Object> cachedList;

  private final HBaseKeyFactory keyFactory;
  private final List<HBaseValueFactory> valueFactories;

  /** The HBase columns mapping of the row. */
  private final ColumnMapping[] columnsMapping;

  /**
   * Test-only constructor: uses the default key factory and no value factories, so
   * non-key, non-timestamp fields are created through the default helper.
   */
  @VisibleForTesting
  LazyHBaseRow(LazySimpleStructObjectInspector oi, ColumnMappings columnMappings) {
    super(oi);
    this.keyFactory = DefaultHBaseKeyFactory.forTest(null, columnMappings);
    this.valueFactories = null;
    this.columnsMapping = columnMappings.getColumnsMapping();
  }

  /**
   * Construct a LazyHBaseRow object with the ObjectInspector.
   *
   * @param oi the struct object inspector describing the row's fields
   * @param serdeParams source of the key factory, value factories and column mappings
   */
  public LazyHBaseRow(LazySimpleStructObjectInspector oi, HBaseSerDeParameters serdeParams) {
    super(oi);
    this.keyFactory = serdeParams.getKeyFactory();
    this.valueFactories = serdeParams.getValueFactories();
    this.columnsMapping = serdeParams.getColumnMappings().getColumnsMapping();
  }

  /**
   * Set the HBase row data (a Result writable) for this LazyStruct and mark the
   * struct as not parsed, so every field is re-read from the new row on next access.
   *
   * @param r the HBase row to expose through this struct
   */
  public void init(Result r) {
    this.result = r;
    setParsed(false);
  }

  /**
   * Creates the lazy object backing one field. The row key is built by the key factory,
   * the timestamp by {@link LazyFactory}, and any other field by the matching value
   * factory when value factories are configured, or by the default helper otherwise.
   */
  @Override
  protected LazyObjectBase createLazyField(final int fieldID, final StructField fieldRef)
      throws SerDeException {
    if (columnsMapping[fieldID].hbaseRowKey) {
      return keyFactory.createKey(fieldRef.getFieldObjectInspector());
    }
    if (columnsMapping[fieldID].hbaseTimestamp) {
      return LazyFactory.createLazyObject(fieldRef.getFieldObjectInspector());
    }

    if (valueFactories != null) {
      return valueFactories.get(fieldID).createValueObject(fieldRef.getFieldObjectInspector());
    }

    // fallback to default
    return HBaseSerDeHelper.createLazyField(columnsMapping, fieldID,
        fieldRef.getFieldObjectInspector());
  }

  /**
   * Get one field out of the HBase row.
   *
   * If the field is a primitive field, return the actual object.
   * Otherwise return the LazyObject.  This is because PrimitiveObjectInspector
   * does not have control over the object used by the user - the user simply
   * directly uses the Object instead of going through
   * Object PrimitiveObjectInspector.get(Object).
   *
   * @param fieldID  The field ID
   * @return         The field as a LazyObject
   */
  @Override
  public Object getField(int fieldID) {
    initFields();
    return uncheckedGetField(fieldID);
  }

  /**
   * Lazily creates the per-field lazy objects and, when a new row has been set since
   * the last access, clears the per-field "inited" flags so values are re-read.
   */
  private void initFields() {
    if (getFields() == null) {
      initLazyFields(oi.getAllStructFieldRefs());
    }
    if (!getParsed()) {
      Arrays.fill(getFieldInited(), false);
      setParsed(true);
    }
  }

  /**
   * Get the field out of the row without checking whether parsing is needed.
   * This is called by both getField and getFieldsAsList.
   *
   * @param fieldID  The id of the field starting from 0.
   * @return  The value of the field, or null for a timestamp field when the row has no cells
   */
  private Object uncheckedGetField(int fieldID) {
    LazyObjectBase[] fields = getFields();
    boolean[] fieldsInited = getFieldInited();

    if (!fieldsInited[fieldID]) {
      fieldsInited[fieldID] = true;

      ColumnMapping colMap = columnsMapping[fieldID];

      if (!colMap.hbaseRowKey && !colMap.hbaseTimestamp && colMap.qualifierName == null) {
        // it is a column family
        // primitive type for Map<Key, Value> can be stored in binary format. Pass in the
        // qualifier prefix to cherry pick the qualifiers that match the prefix instead of picking
        // up everything
        ((LazyHBaseCellMap) fields[fieldID]).init(
            result, colMap.familyNameBytes, colMap.binaryStorage, colMap.qualifierPrefixBytes,
            colMap.isDoPrefixCut());
        return fields[fieldID].getObject();
      }

      if (colMap.hbaseTimestamp) {
        if (result.isEmpty()) {
          // A row without cells has no timestamp. Indexing rawCells()[0] would fail here,
          // so report the field as null. The flag is cleared again so that the reused lazy
          // object, which may still hold a previous row's timestamp, is never returned
          // for this row by a later call.
          fieldsInited[fieldID] = false;
          return null;
        }

        // Get the latest timestamp of all the cells as the row timestamp
        long timestamp = result.rawCells()[0].getTimestamp(); // from hbase-0.96.0
        for (int i = 1; i < result.rawCells().length; i++) {
          timestamp = Math.max(timestamp, result.rawCells()[i].getTimestamp());
        }
        LazyObjectBase lz = fields[fieldID];
        if (lz instanceof LazyTimestamp) {
          ((LazyTimestamp) lz).getWritableObject().setTime(timestamp);
        } else {
          ((LazyLong) lz).getWritableObject().set(timestamp);
        }
        return lz.getObject();
      }

      byte[] bytes;
      if (colMap.hbaseRowKey) {
        bytes = result.getRow();
      } else {
        // it is a column i.e. a column-family with column-qualifier
        bytes = result.getValue(colMap.familyNameBytes, colMap.qualifierNameBytes);
      }
      if (bytes == null || isNull(oi.getNullSequence(), bytes, 0, bytes.length)) {
        fields[fieldID].setNull();
      } else {
        ByteArrayRef ref = new ByteArrayRef();
        ref.setData(bytes);
        fields[fieldID].init(ref, 0, bytes.length);
      }
    }

    return fields[fieldID].getObject();
  }

  /**
   * Get the values of the fields as an ArrayList.
   * The returned list is reused: each call clears and refills the same instance.
   *
   * @return The values of the fields as an ArrayList.
   */
  @Override
  public ArrayList<Object> getFieldsAsList() {
    initFields();
    int fieldCount = getFields().length;
    if (cachedList == null) {
      cachedList = new ArrayList<Object>(fieldCount);
    } else {
      cachedList.clear();
    }
    for (int i = 0; i < fieldCount; i++) {
      cachedList.add(uncheckedGetField(i));
    }
    return cachedList;
  }

  /** Returns this struct itself as the object representation of the row. */
  @Override
  public Object getObject() {
    return this;
  }
}