/** * * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.hadoop.hbase.mob; import java.io.IOException; import org.apache.commons.logging.Log; import org.apache.commons.logging.LogFactory; import org.apache.hadoop.conf.Configuration; import org.apache.hadoop.conf.Configured; import org.apache.hadoop.fs.FileSystem; import org.apache.hadoop.hbase.HBaseConfiguration; import org.apache.hadoop.hbase.HColumnDescriptor; import org.apache.hadoop.hbase.HConstants; import org.apache.hadoop.hbase.HTableDescriptor; import org.apache.hadoop.hbase.TableName; import org.apache.hadoop.hbase.classification.InterfaceAudience; import org.apache.hadoop.hbase.client.Admin; import org.apache.hadoop.hbase.client.Connection; import org.apache.hadoop.hbase.client.ConnectionFactory; import org.apache.hadoop.hbase.client.HBaseAdmin; import org.apache.hadoop.hbase.io.hfile.CacheConfig; import org.apache.hadoop.hbase.util.Bytes; import org.apache.hadoop.hbase.util.EnvironmentEdgeManager; import org.apache.hadoop.util.Tool; import org.apache.hadoop.util.ToolRunner; /** * The cleaner to delete the expired MOB files. */ @InterfaceAudience.Private public class ExpiredMobFileCleaner extends Configured implements Tool { private static final Log LOG = LogFactory.getLog(ExpiredMobFileCleaner.class); /** * Cleans the MOB files when they're expired and their min versions are 0. * If the latest timestamp of Cells in a MOB file is older than the TTL in the column family, * it's regarded as expired. This cleaner deletes them. * At a time T0, the cells in a mob file M0 are expired. If a user starts a scan before T0, those * mob cells are visible, this scan still runs after T0. At that time T1, this mob file M0 * is expired, meanwhile a cleaner starts, the M0 is archived and can be read in the archive * directory. * @param tableName The current table name. * @param family The current family. */ public void cleanExpiredMobFiles(String tableName, HColumnDescriptor family) throws IOException { Configuration conf = getConf(); TableName tn = TableName.valueOf(tableName); FileSystem fs = FileSystem.get(conf); LOG.info("Cleaning the expired MOB files of " + family.getNameAsString() + " in " + tableName); // disable the block cache. Configuration copyOfConf = new Configuration(conf); copyOfConf.setFloat(HConstants.HFILE_BLOCK_CACHE_SIZE_KEY, 0f); CacheConfig cacheConfig = new CacheConfig(copyOfConf); MobUtils.cleanExpiredMobFiles(fs, conf, tn, family, cacheConfig, EnvironmentEdgeManager.currentTime()); } public static void main(String[] args) throws Exception { Configuration conf = HBaseConfiguration.create(); ToolRunner.run(conf, new ExpiredMobFileCleaner(), args); } private void printUsage() { System.err.println("Usage:\n" + "--------------------------\n" + ExpiredMobFileCleaner.class.getName() + " tableName familyName"); System.err.println(" tableName The table name"); System.err.println(" familyName The column family name"); } @edu.umd.cs.findbugs.annotations.SuppressWarnings(value="REC_CATCH_EXCEPTION", justification="Intentional") public int run(String[] args) throws Exception { if (args.length != 2) { printUsage(); return 1; } String tableName = args[0]; String familyName = args[1]; TableName tn = TableName.valueOf(tableName); HBaseAdmin.available(getConf()); Connection connection = ConnectionFactory.createConnection(getConf()); Admin admin = connection.getAdmin(); try { HTableDescriptor htd = admin.getTableDescriptor(tn); HColumnDescriptor family = htd.getFamily(Bytes.toBytes(familyName)); if (family == null || !family.isMobEnabled()) { throw new IOException("Column family " + familyName + " is not a MOB column family"); } if (family.getMinVersions() > 0) { throw new IOException( "The minVersions of the column family is not 0, could not be handled by this cleaner"); } cleanExpiredMobFiles(tableName, family); return 0; } finally { try { admin.close(); } catch (IOException e) { LOG.error("Failed to close the HBaseAdmin.", e); } try { connection.close(); } catch (IOException e) { LOG.error("Failed to close the connection.", e); } } } }