/** * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY * KIND, either express or implied. See the License for the * specific language governing permissions and limitations * under the License. */ package org.apache.hadoop.hive.metastore.messaging.json; import java.util.Iterator; import java.util.LinkedHashMap; import java.util.List; import java.util.Map; import javax.annotation.Nullable; import com.google.common.collect.Iterables; import org.apache.hadoop.fs.FileStatus; import org.apache.hadoop.fs.FileSystem; import org.apache.hadoop.fs.Path; import org.apache.hadoop.hive.common.FileUtils; import org.apache.hadoop.hive.metastore.api.Database; import org.apache.hadoop.hive.metastore.api.Function; import org.apache.hadoop.hive.metastore.api.Index; import org.apache.hadoop.hive.metastore.api.NotificationEvent; import org.apache.hadoop.hive.metastore.api.Partition; import org.apache.hadoop.hive.metastore.api.Table; import org.apache.hadoop.hive.metastore.messaging.AddPartitionMessage; import org.apache.hadoop.hive.metastore.messaging.AlterIndexMessage; import org.apache.hadoop.hive.metastore.messaging.AlterPartitionMessage; import org.apache.hadoop.hive.metastore.messaging.AlterTableMessage; import org.apache.hadoop.hive.metastore.messaging.CreateDatabaseMessage; import org.apache.hadoop.hive.metastore.messaging.CreateFunctionMessage; import org.apache.hadoop.hive.metastore.messaging.CreateIndexMessage; import org.apache.hadoop.hive.metastore.messaging.CreateTableMessage; import org.apache.hadoop.hive.metastore.messaging.DropDatabaseMessage; import org.apache.hadoop.hive.metastore.messaging.DropFunctionMessage; import org.apache.hadoop.hive.metastore.messaging.DropIndexMessage; import org.apache.hadoop.hive.metastore.messaging.DropPartitionMessage; import org.apache.hadoop.hive.metastore.messaging.DropTableMessage; import org.apache.hadoop.hive.metastore.messaging.InsertMessage; import org.apache.hadoop.hive.metastore.messaging.MessageDeserializer; import org.apache.hadoop.hive.metastore.messaging.MessageFactory; import org.apache.hadoop.hive.metastore.messaging.PartitionFiles; import org.apache.thrift.TBase; import org.apache.thrift.TDeserializer; import org.apache.thrift.TException; import org.apache.thrift.TSerializer; import org.apache.thrift.protocol.TJSONProtocol; import org.codehaus.jackson.JsonFactory; import org.codehaus.jackson.JsonNode; import org.codehaus.jackson.JsonParser; import org.codehaus.jackson.map.ObjectMapper; import org.codehaus.jackson.node.ObjectNode; import org.slf4j.Logger; import org.slf4j.LoggerFactory; import com.google.common.collect.Iterators; import com.google.common.collect.Lists; /** * The JSON implementation of the MessageFactory. Constructs JSON implementations of each * message-type. */ public class JSONMessageFactory extends MessageFactory { private static final Logger LOG = LoggerFactory.getLogger(JSONMessageFactory.class.getName()); private static JSONMessageDeserializer deserializer = new JSONMessageDeserializer(); private static TDeserializer thriftDeSerializer = new TDeserializer(new TJSONProtocol.Factory()); @Override public MessageDeserializer getDeserializer() { return deserializer; } @Override public String getMessageFormat() { return "json-0.2"; } @Override public CreateDatabaseMessage buildCreateDatabaseMessage(Database db) { return new JSONCreateDatabaseMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, db.getName(), now()); } @Override public DropDatabaseMessage buildDropDatabaseMessage(Database db) { return new JSONDropDatabaseMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, db.getName(), now()); } @Override public CreateTableMessage buildCreateTableMessage(Table table, Iterator<String> fileIter) { return new JSONCreateTableMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, table, fileIter, now()); } @Override public AlterTableMessage buildAlterTableMessage(Table before, Table after, boolean isTruncateOp) { return new JSONAlterTableMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, before, after, isTruncateOp, now()); } @Override public DropTableMessage buildDropTableMessage(Table table) { return new JSONDropTableMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, table.getDbName(), table.getTableName(), now()); } @Override public AddPartitionMessage buildAddPartitionMessage(Table table, Iterator<Partition> partitionsIterator, Iterator<PartitionFiles> partitionFileIter) { return new JSONAddPartitionMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, table, partitionsIterator, partitionFileIter, now()); } @Override public AlterPartitionMessage buildAlterPartitionMessage(Table table, Partition before, Partition after, boolean isTruncateOp) { return new JSONAlterPartitionMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, table, before, after, isTruncateOp, now()); } @Override public DropPartitionMessage buildDropPartitionMessage(Table table, Iterator<Partition> partitionsIterator) { return new JSONDropPartitionMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, table, getPartitionKeyValues(table, partitionsIterator), now()); } @Override public CreateFunctionMessage buildCreateFunctionMessage(Function fn) { return new JSONCreateFunctionMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, fn, now()); } @Override public DropFunctionMessage buildDropFunctionMessage(Function fn) { return new JSONDropFunctionMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, fn, now()); } @Override public CreateIndexMessage buildCreateIndexMessage(Index idx) { return new JSONCreateIndexMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, idx, now()); } @Override public DropIndexMessage buildDropIndexMessage(Index idx) { return new JSONDropIndexMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, idx, now()); } @Override public AlterIndexMessage buildAlterIndexMessage(Index before, Index after) { return new JSONAlterIndexMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, before, after, now()); } @Override public InsertMessage buildInsertMessage(String db, String table, Map<String, String> partKeyVals, boolean replace, Iterator<String> fileIter) { return new JSONInsertMessage(MS_SERVER_URL, MS_SERVICE_PRINCIPAL, db, table, partKeyVals, replace, fileIter, now()); } private long now() { return System.currentTimeMillis() / 1000; } static Map<String, String> getPartitionKeyValues(Table table, Partition partition) { Map<String, String> partitionKeys = new LinkedHashMap<String, String>(); for (int i = 0; i < table.getPartitionKeysSize(); ++i) partitionKeys.put(table.getPartitionKeys().get(i).getName(), partition.getValues().get(i)); return partitionKeys; } static List<Map<String, String>> getPartitionKeyValues(final Table table, Iterator<Partition> iterator) { return Lists.newArrayList(Iterators.transform(iterator, new com.google.common.base.Function<Partition, Map<String, String>>() { @Override public Map<String, String> apply(@Nullable Partition partition) { return getPartitionKeyValues(table, partition); } })); } static String createTableObjJson(Table tableObj) throws TException { TSerializer serializer = new TSerializer(new TJSONProtocol.Factory()); return serializer.toString(tableObj, "UTF-8"); } static String createPartitionObjJson(Partition partitionObj) throws TException { TSerializer serializer = new TSerializer(new TJSONProtocol.Factory()); return serializer.toString(partitionObj, "UTF-8"); } static String createFunctionObjJson(Function functionObj) throws TException { TSerializer serializer = new TSerializer(new TJSONProtocol.Factory()); return serializer.toString(functionObj, "UTF-8"); } static String createIndexObjJson(Index indexObj) throws TException { TSerializer serializer = new TSerializer(new TJSONProtocol.Factory()); return serializer.toString(indexObj, "UTF-8"); } public static ObjectNode getJsonTree(NotificationEvent event) throws Exception { return getJsonTree(event.getMessage()); } public static ObjectNode getJsonTree(String eventMessage) throws Exception { JsonParser jsonParser = (new JsonFactory()).createJsonParser(eventMessage); ObjectMapper mapper = new ObjectMapper(); return mapper.readValue(jsonParser, ObjectNode.class); } public static Table getTableObj(ObjectNode jsonTree) throws Exception { TDeserializer deSerializer = new TDeserializer(new TJSONProtocol.Factory()); Table tableObj = new Table(); String tableJson = jsonTree.get("tableObjJson").asText(); deSerializer.deserialize(tableObj, tableJson, "UTF-8"); return tableObj; } /* * TODO: Some thoughts here : We have a current todo to move some of these methods over to * MessageFactory instead of being here, so we can override them, but before we move them over, * we should keep the following in mind: * * a) We should return Iterables, not Lists. That makes sure that we can be memory-safe when * implementing it rather than forcing ourselves down a path wherein returning List is part of * our interface, and then people use .size() or somesuch which makes us need to materialize * the entire list and not change. Also, returning Iterables allows us to do things like * Iterables.transform for some of these. * b) We should not have "magic" names like "tableObjJson", because that breaks expectation of a * couple of things - firstly, that of serialization format, although that is fine for this * JSONMessageFactory, and secondly, that makes us just have a number of mappings, one for each * obj type, and sometimes, as the case is with alter, have multiples. Also, any event-specific * item belongs in that event message / event itself, as opposed to in the factory. It's okay to * have utility accessor methods here that are used by each of the messages to provide accessors. * I'm adding a couple of those here. * */ public static TBase getTObj(String tSerialized, Class<? extends TBase> objClass) throws Exception{ TBase obj = objClass.newInstance(); thriftDeSerializer.deserialize(obj, tSerialized, "UTF-8"); return obj; } public static Iterable<? extends TBase> getTObjs( Iterable<String> objRefStrs, final Class<? extends TBase> objClass) throws Exception { try { return Iterables.transform(objRefStrs, new com.google.common.base.Function<String,TBase>(){ @Override public TBase apply(@Nullable String objStr){ try { return getTObj(objStr, objClass); } catch (Exception e) { throw new RuntimeException(e); } } }); } catch (RuntimeException re){ // We have to add this bit of exception handling here, because Function.apply does not allow us to throw // the actual exception that might be a checked exception, so we wind up needing to throw a RuntimeException // with the previously thrown exception as its cause. However, since RuntimeException.getCause() returns // a throwable instead of an Exception, we have to account for the possibility that the underlying code // might have thrown a Throwable that we wrapped instead, in which case, continuing to throw the // RuntimeException is the best thing we can do. Throwable t = re.getCause(); if (t instanceof Exception){ throw (Exception) t; } else { throw re; } } } // If we do not need this format of accessor using ObjectNode, this is a candidate for removal as well public static Iterable<? extends TBase> getTObjs( ObjectNode jsonTree, String objRefListName, final Class<? extends TBase> objClass) throws Exception { Iterable<JsonNode> jsonArrayIterator = jsonTree.get(objRefListName); com.google.common.base.Function<JsonNode,String> textExtractor = new com.google.common.base.Function<JsonNode, String>() { @Nullable @Override public String apply(@Nullable JsonNode input) { return input.asText(); } }; return getTObjs(Iterables.transform(jsonArrayIterator, textExtractor), objClass); } }