/*
* ARX: Powerful Data Anonymization
* Copyright 2012 - 2017 Fabian Prasser, Florian Kohlmayer and contributors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.deidentifier.arx.examples;
import java.io.IOException;
import java.util.Iterator;
import org.deidentifier.arx.ARXAnonymizer;
import org.deidentifier.arx.ARXConfiguration;
import org.deidentifier.arx.ARXLattice.ARXNode;
import org.deidentifier.arx.ARXResult;
import org.deidentifier.arx.AttributeType;
import org.deidentifier.arx.Data;
import org.deidentifier.arx.Data.DefaultData;
import org.deidentifier.arx.DataType;
import org.deidentifier.arx.aggregates.HierarchyBuilderIntervalBased;
import org.deidentifier.arx.aggregates.HierarchyBuilderIntervalBased.Range;
import org.deidentifier.arx.aggregates.HierarchyBuilderRedactionBased;
import org.deidentifier.arx.aggregates.HierarchyBuilderRedactionBased.Order;
import org.deidentifier.arx.criteria.KAnonymity;
import org.deidentifier.arx.metric.v2.__MetricV2;
import cern.colt.Arrays;
/**
* This class implements an example for using the generalized loss metric with different types of
* generalization hierarchies.
*
* @author Fabian Prasser
* @author Florian Kohlmayer
*/
public class Example25 extends Example {
/**
* Entry point.
*
* @param args
* The arguments
* @throws IOException
*/
public static void main(String[] args) throws IOException {
// Define data
DefaultData data = Data.create();
data.add("age", "gender", "zipcode");
data.add("34", "male", "81667");
data.add("45", "female", "81675");
data.add("66", "male", "81925");
data.add("70", "female", "81931");
data.add("34", "female", "81931");
data.add("70", "male", "81931");
data.add("45", "male", "81931");
// Define hierarchies
HierarchyBuilderIntervalBased<Long> builder1 = HierarchyBuilderIntervalBased.create(
DataType.INTEGER,
new Range<Long>(0l,0l,0l),
new Range<Long>(99l,99l,99l));
// Define base intervals
builder1.setAggregateFunction(DataType.INTEGER.createAggregate().createIntervalFunction(true, false));
builder1.addInterval(0l, 20l);
builder1.addInterval(20l, 33l);
// Define grouping fanouts
builder1.getLevel(0).addGroup(2);
builder1.getLevel(1).addGroup(3);
HierarchyBuilderRedactionBased<?> builder2 = HierarchyBuilderRedactionBased.create(Order.RIGHT_TO_LEFT,
Order.RIGHT_TO_LEFT,
' ',
'*');
// builder2.setDomainProperties(100000, 10, 5);
// builder2.setDomainAndAlphabetSize(30000, 10, 5);
// builder2.setDomainSize(30000, 5);
builder2.setAlphabetSize(10, 5);
data.getDefinition().setAttributeType("age", builder1);
data.getDefinition().setAttributeType("gender", AttributeType.QUASI_IDENTIFYING_ATTRIBUTE);
data.getDefinition().setAttributeType("zipcode", builder2);
// Create an instance of the anonymizer
ARXAnonymizer anonymizer = new ARXAnonymizer();
ARXConfiguration config = ARXConfiguration.create();
config.addPrivacyModel(new KAnonymity(3));
config.setMaxOutliers(0d);
config.setQualityModel(__MetricV2.createLossMetric());
config.setSuppressionAlwaysEnabled(false);
ARXResult result = anonymizer.anonymize(data, config);
// Process results
for (ARXNode[] level : result.getLattice().getLevels()) {
for (ARXNode node : level) {
Iterator<String[]> transformed = result.getOutput(node, false).iterator();
System.out.println("Transformation : "+Arrays.toString(node.getTransformation()));
System.out.println("InformationLoss: "+node.getHighestScore());
while (transformed.hasNext()) {
System.out.print(" ");
System.out.println(Arrays.toString(transformed.next()));
}
}
}
}
}