/* * Licensed to the Apache Software Foundation (ASF) under one * or more contributor license agreements. See the NOTICE file * distributed with this work for additional information * regarding copyright ownership. The ASF licenses this file * to you under the Apache License, Version 2.0 (the * "License"); you may not use this file except in compliance * with the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.manning.hip.ch11; import com.manning.hip.common.Range; import org.apache.commons.lang.StringUtils; import org.apache.pig.FilterFunc; import org.apache.pig.FuncSpec; import org.apache.pig.data.DataType; import org.apache.pig.data.Tuple; import org.apache.pig.impl.logicalLayer.FrontendException; import org.apache.pig.impl.logicalLayer.schema.Schema; import java.io.IOException; import java.util.ArrayList; import java.util.List; import java.util.regex.Pattern; /** * This function removes tuples that contain a private IP address. */ public class IsPrivateIP extends FilterFunc { protected List<Range<Long>> ipRanges; public IsPrivateIP() { ipRanges = new ArrayList<Range<Long>>(); ipRanges.add(getRange("10.0.0.0", "10.255.255.255")); ipRanges.add(getRange("172.16.0.0", "172.31.255.255")); ipRanges.add(getRange("192.168.0.0", "192.168.255.255")); } @Override public List<FuncSpec> getArgToFuncMapping() throws FrontendException { List<FuncSpec> funcList = new ArrayList<FuncSpec>(); funcList.add(new FuncSpec(this.getClass().getName(), new Schema(new Schema.FieldSchema(null, DataType.CHARARRAY)))); return funcList; } @Override public Boolean exec(Tuple t) throws IOException { if (t == null || t.size() == 0) return false; String address = extractFieldAsString(t, 0); return address != null && matchesIp(ipToInt(address)); } public static Range<Long> getRange(String startIp, String endIp) { return new Range<Long>(ipToInt(startIp), ipToInt(endIp)); } public boolean matchesIp(long ip) { for(Range<Long> range: ipRanges) { if(range.contains(ip)) { return true; } } return false; } public String extractFieldAsString(Tuple t, int field) { String query; try { query = (String) t.get(field); if (query == null) return null; query = query.trim(); } catch (Exception e) { System.err.println( "PrivateIPFilter: failed to process input; error - " + e.getMessage()); return null; } if (query.equals("")) { return null; } return query; } public static long ipToInt(String addr) { String[] octets = StringUtils.split(addr, "."); long ip = 0; for (String octet : octets) { ip = (ip << 8) + Integer.valueOf(octet); } return ip; } }