TrackingMultimap.java example

Explorer

concourse-master
- concourse-cli
  - src
    - main
      - java
        com
        cinchapi
        concourse
        cli
        CommandLineInterface.java
        CommandLineInterfaceRunner.java
        NoOptions.java
        Options.java
        util
        CommandLineInterfaces.java
- concourse-driver-java
  - src
    - main
      - java
        com
        cinchapi
        concourse
        CachedConnectionPool.java
        Calculator.java
        Concourse.java
        ConcourseThriftDriver.java
        ConnectionPool.java
        Constants.java
        DuplicateEntryException.java
        FixedConnectionPool.java
        InvalidArgumentException.java
        Link.java
        ParseException.java
        Tag.java
        Timestamp.java
        TransactionException.java
        annotate
        CompoundOperation.java
        DoNotInvoke.java
        Incubating.java
        MustOverride.java
        PackagePrivate.java
        UtilityClass.java
        cache
        ReferenceCache.java
        config
        ConcourseClientPreferences.java
        ConcourseServerPreferences.java
        PreferencesHandler.java
        lang
        AbstractSymbol.java
        BuildableStartState.java
        BuildableState.java
        ConjunctionSymbol.java
        Criteria.java
        KeyState.java
        KeySymbol.java
        Language.java
        OperatorState.java
        OperatorSymbol.java
        ParenthesisSymbol.java
        PostfixNotationSymbol.java
        StartState.java
        State.java
        Symbol.java
        TimestampState.java
        TimestampSymbol.java
        ValueState.java
        ValueSymbol.java
        security
        ClientSecurity.java
        thrift
        AccessToken.java
        ComplexTObject.java
        ComplexTObjectType.java
        ConcourseService.java
        Diff.java
        DuplicateEntryException.java
        InvalidArgumentException.java
        ManagementException.java
        Operator.java
        ParseException.java
        SecurityException.java
        TCriteria.java
        TObject.java
        TSymbol.java
        TSymbolType.java
        TransactionException.java
        TransactionToken.java
        Type.java
        time
        AtomicClock.java
        Time.java
        util
        ByteBuffers.java
        Collections.java
        ConcurrentLoadingQueue.java
        ConcurrentMaps.java
        Conversions.java
        Convert.java
        DataServices.java
        FileOps.java
        Integers.java
        KeyValue.java
        Logging.java
        MorePaths.java
        Networking.java
        Numbers.java
        Platform.java
        PrettyLinkedHashMap.java
        PrettyLinkedTableMap.java
        Processes.java
        Queues.java
        QuoteAwareStringSplitter.java
        Random.java
        RandomStringGenerator.java
        ReadOnlyIterator.java
        Resources.java
        Serializables.java
        SplitOption.java
        StringBuilderWriter.java
        StringSplitter.java
        Strings.java
        TLists.java
        TSets.java
        Timestamps.java
        Transformers.java
        TypeAdapters.java
        Version.java
        Versions.java
        ZipFiles.java
        org
        imca_cat
        pollingwatchservice
        EventingWatchService.java
        JavaUtilities.java
        PathWatchService.java
        PollingWatchEvent.java
        PollingWatchKey.java
        PollingWatchKeyState.java
        PollingWatchService.java
        PollingWatchServiceExceptionHandler.java
        PollingWatchServiceInfoHandler.java
        package-info.java
    - test
      - java
        com
        cinchapi
        concourse
        TagTest.java
        TimestampTest.java
        config
        ConcourseClientPreferencesTest.java
        lang
        CriteriaTest.java
        thrift
        ComplexTObjectTest.java
        TObjectTest.java
        util
        ByteBuffersTest.java
        ConcurrentLoadingQueueTest.java
        ConcurrentMapsTest.java
        ConvertTest.java
        FileOpsTest.java
        MorePathsTest.java
        NumbersTest.java
        QueuesTest.java
        QuoteAwareStringSplitterTest.java
        ResourcesTest.java
        SerializablesTest.java
        StringSplitterPerformanceTest.java
        StringSplitterTest.java
        StringsTest.java
        TListsTest.java
        TSetsTest.java
        TimestampsTest.java
        TransformersTest.java
        org
        imca_cat
        pollingwatchservice
        PollingWatchServiceTest.java
- concourse-ete-test-core
  - src
    - main
      - java
        com
        cinchapi
        concourse
        server
        ManagedConcourseServer.java
        test
        ClientServerTest.java
        CrossVersionTest.java
        PluginTest.java
        UpgradeTest.java
        Variables.java
        runners
        CrossVersionTestRunner.java
        util
        ConcourseCodebase.java
        ConcourseServerDownloader.java
        Processes.java
    - test
      - java
        com
        cinchapi
        concourse
        server
        ManagedConcourseServerTest.java
        util
        ConcourseCodebaseTest.java
- concourse-import
  - src
    - main
      - java
        com
        cinchapi
        concourse
        importer
        CsvImporter.java
        DelimitedLineImporter.java
        Headered.java
        Importer.java
        JsonImporter.java
        LegacyCsvImporter.java
        LineBasedImporter.java
        Transformer.java
        cli
        ImportCli.java
        util
        Importables.java
    - test
      - java
        com
        cinchapi
        concourse
        importer
        util
        ImportablesTest.java
- concourse-integration-tests
  - src
    - main
      - java
        com
        cinchapi
        concourse
        util
        StandardActions.java
    - test
      - java
        com
        cinchapi
        concourse
        AddTest.java
        AtomicOperationWofkflowTest.java
        AuditTest.java
        BrowseTest.java
        CachedConnectionPoolTest.java
        CalculateAverageTest.java
        CalculateSumTest.java
        ChronologizeTest.java
        ClearTest.java
        CompoundOperationTest.java
        ConnectTest.java
        ConnectionPoolTest.java
        CounterTest.java
        DiffTest.java
        ExceptionHandlingTest.java
        FindCriteriaTest.java
        FindOperatorConversionTest.java
        FixedConnectionPoolTest.java
        InsertTest.java
        JsonifyTest.java
        LinksToTest.java
        OperatorAliasTest.java
        QueryOnRecordIdTest.java
        ReconcileTest.java
        ReferentialIntegrityTest.java
        ResolvableLinkTest.java
        SecurityExceptionTest.java
        SetTest.java
        SmokeTest.java
        TransactionIsolationTest.java
        TransactionWorkflowTest.java
        VerifyOrSetTest.java
        bugrepro
        CON108.java
        CON167.java
        CON171.java
        CON173.java
        CON217.java
        CON279.java
        CON326.java
        CON469.java
        CON473.java
        CON474.java
        CON52.java
        CON55.java
        CON72.java
        CON75.java
        GH112.java
        GH113.java
        cli
        CommandLineInterfaceRunnerTest.java
        demo
        GettingStartedTest.java
        http
        HttpLoginTest.java
        HttpTest.java
        RestAuditTest.java
        RestInventoryTest.java
        RestTest.java
        RestWriteTest.java
        importer
        CollegeImportTest.java
        CsvImportTest.java
        DelimitedLineImporterTest.java
        ResolveKeyTest.java
        YoutubeImportTest.java
        perf
        FindThroughputTest.java
        OpsPerSecondTest.java
        TransactionThroughputTest.java
        WritePerformanceTest.java
        security
        AuthenticationTest.java
        shell
        ConcourseShellTest.java
        test
        ConcourseIntegrationTest.java
        testsuite
        BugReproSuite.java
        HttpTestSuite.java
        ImportTestSuite.java
        IntegrationTestSuite.java
        PerformanceTestSuite.java
        PreReleaseTestSuite.java
        thrift
        ThriftComplianceTest.java
- concourse-plugin-core
  - src
    - main
      - java
        com
        cinchapi
        concourse
        server
        plugin
        BackgroundExecutor.java
        BackgroundThread.java
        ConcourseRuntime.java
        ConcourseRuntimeAuthorized.java
        Packet.java
        Plugin.java
        PluginConfiguration.java
        PluginContext.java
        PluginException.java
        PluginExecutors.java
        PluginRestricted.java
        PluginRuntime.java
        RealTimePlugin.java
        RemoteAttributeExchange.java
        RemoteInvocationThread.java
        RemoteMessage.java
        RemoteMethodRequest.java
        RemoteMethodResponse.java
        RemoteStopRequest.java
        StandardPluginConfiguration.java
        StatefulConcourseService.java
        concurrent
        FileLocks.java
        SpinningFileLock.java
        data
        Dataset.java
        Insertable.java
        ObjectResultDataset.java
        ResultDataset.java
        TObjectResultDataset.java
        TrackingLinkedHashMultimap.java
        TrackingMultimap.java
        WriteEvent.java
        hook
        AfterInstallHook.java
        PluginHook.java
        io
        InterProcessCommunication.java
        MappedAtomicInteger.java
        MessageQueue.java
        PluginSerializable.java
        PluginSerializer.java
        SharedMemory.java
        util
        Versions.java
    - test
      - java
        com
        cinchapi
        concourse
        server
        plugin
        BackgroundThreadTest.java
        MockConcourseRuntime.java
        PluginConfigurationTest.java
        concurrent
        SpinningFileLockTest.java
        data
        ObjectResultDatasetTest.java
        TObjectResultDatasetTest.java
        TrackingMultimapBaseTest.java
        TrackingMultimapDataTypeTest.java
        TrackingMultimapProportionsTest.java
        TrackingMultimapTest.java
        TrackingMultimapVariableTypeTest.java
        io
        InterProcessCommunicationTest.java
        MappedAtomicIntegerTest.java
        MessageQueueTest.java
        PluginSerializerTest.java
        SharedMemoryTest.java
        TestSerializableObject.java
        util
        VersionsTest.java
- concourse-plugin-core-tests
  - src
    - test
      - java
        com
        cinchapi
        concourse
        server
        plugin
        SharedMemoryCompactionTest.java
        TestPlugin.java
- concourse-server
  - src
    - main
      - java
        com
        cinchapi
        common
        util
        IncrementalSortMap.java
        NonBlockingHashMultimap.java
        concourse
        annotate
        Alias.java
        Atomic.java
        Authorized.java
        AutoRetry.java
        Batch.java
        Experimental.java
        HistoricalRead.java
        NonPreference.java
        Restricted.java
        VersionControl.java
        lang
        Expression.java
        NaturalLanguage.java
        Parser.java
        SyntaxException.java
        ast
        AST.java
        AndTree.java
        ConjunctionTree.java
        ExpressionTree.java
        OrTree.java
        security
        AccessManager.java
        LegacyAccessManager.java
        Passwords.java
        server
        BaseConcourseServer.java
        ConcourseServer.java
        GlobalState.java
        Operations.java
        ShutdownRunner.java
        calculate
        Calculations.java
        KeyCalculation.java
        KeyRecordCalculation.java
        cli
        CommandLineInterfaceInformation.java
        EnvironmentOptions.java
        InstallPluginCli.java
        ManageDataCli.java
        ManageEnvironmentsCli.java
        ManagePluginsCli.java
        ManageUsersCli.java
        ManagementCli.java
        NoOptions.java
        Options.java
        PluginCli.java
        VersionCli.java
        concurrent
        AbstractLockService.java
        AtomicLock.java
        BlockingExecutorService.java
        ConcourseExecutors.java
        GuavaInternals.java
        LockService.java
        LockType.java
        Locks.java
        PriorityReadWriteLock.java
        RangeLockService.java
        RangeReadWriteLock.java
        RangeToken.java
        RangeTokens.java
        ReadWriteSharedLock.java
        ReferenceCountingLock.java
        Threads.java
        Token.java
        TokenReadWriteLock.java
        http
        Endpoint.java
        EndpointContainer.java
        HttpAuthToken.java
        HttpRequest.java
        HttpRequests.java
        HttpResponse.java
        HttpServer.java
        JsonEndpoint.java
        RouteArgs.java
        RoutingKey.java
        errors
        BadLoginSyntaxError.java
        BadRequest.java
        HttpError.java
        router
        HelpRouter.java
        IndexRouter.java
        webserver
        ConcourseHttpHandler.java
        io
        Bits.java
        Byteable.java
        ByteableCollections.java
        Byteables.java
        Cleaners.java
        Composite.java
        FileSystem.java
        ReRunnable.java
        Syncable.java
        process
        Callback.java
        Forkable.java
        JavaApp.java
        NoOpCallback.java
        PrematureShutdownHandler.java
        ServerProcesses.java
        jmx
        ManagedOperation.java
        management
        ConcourseManagementService.java
        model
        Position.java
        PrimaryKey.java
        Ranges.java
        TObjectSorter.java
        Text.java
        Value.java
        plugin
        PluginInstallException.java
        PluginManager.java
        storage
        Action.java
        AtomicOperation.java
        AtomicStateException.java
        AtomicSupport.java
        BaseStore.java
        BufferedStore.java
        Engine.java
        Functions.java
        Inventory.java
        InventoryTracker.java
        PermanentStore.java
        Store.java
        Stores.java
        Transaction.java
        TransactionStateException.java
        TransactionSupport.java
        VersionChangeListener.java
        VersionChangeNotifier.java
        VersionGetter.java
        Versioned.java
        cache
        BloomFilter.java
        ByteableFunnel.java
        LazyCache.java
        LoggingBloomFilter.java
        db
        Block.java
        BlockIndex.java
        BrowsableRecord.java
        CompactRevision.java
        Database.java
        PrimaryBlock.java
        PrimaryRecord.java
        PrimaryRevision.java
        Record.java
        Revision.java
        SearchBlock.java
        SearchRecord.java
        SearchRevision.java
        SecondaryBlock.java
        SecondaryRecord.java
        SecondaryRevision.java
        temp
        Buffer.java
        CapacityException.java
        Limbo.java
        Queue.java
        Write.java
        upgrade
        SmartUpgradeTask.java
        UpgradeTask.java
        UpgradeTasks.java
        task
        Upgrade0_5_0_1.java
        Upgrade0_5_0_2.java
        Upgrade1.java
        Upgrade2.java
        util
        AutoHashMap.java
        AutoMap.java
        AutoSkipListMap.java
        Commands.java
        Comparators.java
        ConcurrentSkipListMultiset.java
        Environments.java
        Logger.java
        LongBitSet.java
        MultimapViews.java
        NaturalSorter.java
        ObjectUtils.java
        Producer.java
        TArrays.java
        TCollections.java
        TMaps.java
        TStrings.java
        TestData.java
        ThreadFactories.java
        spark
        AbstractRoute.java
        Access.java
        Filter.java
        HaltException.java
        ModelAndView.java
        QueryParamsMap.java
        Request.java
        RequestResponseFactory.java
        Response.java
        ResponseTransformerRoute.java
        Route.java
        Session.java
        Spark.java
        TemplateViewRoute.java
        route
        HttpMethod.java
        RouteMatch.java
        RouteMatcher.java
        RouteMatcherFactory.java
        SimpleRouteMatcher.java
        servlet
        FilterTools.java
        SparkApplication.java
        SparkFilter.java
        template
        MustacheTemplateRoute.java
        TemplateRoute.java
        utils
        IOUtils.java
        MimeParse.java
        SparkUtils.java
        webserver
        MatcherFilter.java
        NotConsumedException.java
        RequestWrapper.java
        ResponseWrapper.java
        SparkServer.java
        SparkServerFactory.java
        SparkServerImpl.java
    - test
      - java
        com
        cinchapi
        common
        util
        IncrementalSortMapTest.java
        NonBlockingHashMultimapTest.java
        concourse
        lang
        NaturalLanguageTest.java
        ParserTest.java
        security
        AccessManagerTest.java
        LegacyAccessManagerTest.java
        server
        ConcourseServerBaseTest.java
        ConcourseServerTest.java
        cache
        LoggingBloomFilterTest.java
        concurrent
        BlockingExecutorServiceTest.java
        ConcurrencySuite.java
        LockServiceTest.java
        RangeLockServiceTest.java
        RangeTokensTest.java
        ReadWriteSharedLockTest.java
        http
        EndpointContainerTest.java
        RoutingKeyTest.java
        io
        ByteableCollectionsTest.java
        ByteableTest.java
        FileSystemTest.java
        process
        JavaAppTest.java
        model
        ModelBenchmark.java
        ModelSuite.java
        PositionTest.java
        PrimaryKeyTest.java
        TextTest.java
        ValueTest.java
        plugin
        concurrent
        CrossProcessSpinningFileLockTest.java
        io
        CrossProcessInterProcessCommunicationTest.java
        CrossProcessMessageQueueTest.java
        CrossProcessSharedMemoryTest.java
        storage
        AtomicOperationTest.java
        BufferedStoreTest.java
        EngineAtomicOperationTest.java
        EngineTest.java
        InventoryTest.java
        StorageBenchmark.java
        StorageSuite.java
        StoreSuite.java
        StoreTest.java
        StoresTest.java
        TransactionAtomicOperationTest.java
        TransactionGarbageCollectionTest.java
        TransactionTest.java
        db
        BlockIndexTest.java
        BlockSuite.java
        BlockTest.java
        BrowsableRecordTest.java
        DatabaseTest.java
        PrimaryBlockTest.java
        PrimaryRecordTest.java
        RecordSuite.java
        RecordTest.java
        RevisionTest.java
        SearchBlockTest.java
        SearchRecordTest.java
        SecondaryBlockTest.java
        SecondaryRecordTest.java
        temp
        BufferTest.java
        LimboTest.java
        QueueTest.java
        WriteTest.java
        util
        AutoHashMapTest.java
        AutoMapSuite.java
        AutoMapTest.java
        AutoSkipListMapTest.java
        LongBitSetTest.java
        NaturalSorterTest.java
        TArraysTest.java
        TCollectionsTest.java
        google
        common
        collect
        AbstractMultimapTest.java
- concourse-shell
  - src
    - main
      - java
        com
        cinchapi
        concourse
        shell
        CommandLine.java
        ConcourseShell.java
        EvaluationException.java
        ExitRequest.java
        HelpRequest.java
        IrregularEvaluationResult.java
        MultiLineRequest.java
        NewLineRequest.java
        ProgramCrash.java
        SyntaxTools.java
    - test
      - java
        com
        cinchapi
        concourse
        shell
        SyntaxToolsTest.java
- concourse-unit-test-core
  - src
    - main
      - java
        com
        cinchapi
        concourse
        test
        ConcourseBaseTest.java
        ConcourseBenchmarkTest.java
        Variables.java
- concourse-upgrade-tests
  - src
    - test
      - java
        com
        cinchapi
        concouse
        server
        upgrade
        UpgradeTask0_5_0_2Test.java
- examples
  - bank-overdraft-protection
    - java
      - src
        main
        java
        com
        cinchapi
        concourse
        example
        DatabaseObject.java
        bank
        Account.java
        ConcourseAccount.java
        ConcourseCustomer.java
        Constants.java
        Customer.java
        SqlAccount.java
        SqlCustomer.java
        test
        java
        com
        cinchapi
        concourse
        example
        bank
        ConcourseBankTest.java
  - mock-twitter-cli
    - java
      - src
        main
        java
        com
        cinchapi
        concourse
        example
        mocktwitter
        ConcourseTwitter.java
        MysqlTwitter.java
        Twitter.java
        TwitterCLI.java

/*
 * Copyright (c) 2013-2017 Cinchapi Inc.
 * 
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 * 
 * http://www.apache.org/licenses/LICENSE-2.0
 * 
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.cinchapi.concourse.server.plugin.data;

import java.util.AbstractMap;
import java.util.AbstractSet;
import java.util.Collections;
import java.util.Iterator;
import java.util.Map;
import java.util.Objects;
import java.util.Set;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.atomic.AtomicLong;

import javax.annotation.Nullable;
import javax.annotation.concurrent.NotThreadSafe;

import org.apache.commons.math3.stat.StatUtils;
import org.apache.commons.math3.stat.descriptive.DescriptiveStatistics;

import com.cinchapi.concourse.Link;
import com.cinchapi.concourse.thrift.TObject;
import com.cinchapi.concourse.thrift.Type;
import com.google.common.base.MoreObjects;
import com.google.common.base.Preconditions;
import com.google.common.collect.Maps;
import com.google.common.collect.Sets;
import com.zaxxer.sparsebits.SparseBitSet;

/**
 * <p>
 * An implementation of a {@code Map} that characterizes entries on the fly as
 * they are added or removed. This is used to characterize user data as it is
 * being entered, so that the visualization engine can query this map to
 * immediately view data characterization in constant time.
 * </p>
 * <p>
 * Apart from {@link #put(Object, Set)}, {@link #remove(Object)},
 * {@link #putAll(Map)}, and {@link #clear()}, all methods are delegated to an
 * internal map. The four aforementioned methods are overridden in terms of
 * functionality to characterize the entries in the map before performing the
 * original intended function.
 * </p>
 * <p>
 * {@link TrackingMultimap} is parametrized by type-parameters K and V, but the
 * underlying internal map is in the form {@code Map<K, Set<V>>}. This is to
 * comply with the format of data, which is either a Map from Strings (keys) to
 * Objects (values), or Objects (values) to Longs (records).
 * </p>
 * 
 * @author Jeff Nelson
 */
// TODO talk about what is tracked for keys and what is tracked for values
@NotThreadSafe
public abstract class TrackingMultimap<K, V> extends AbstractMap<K, Set<V>> {

    /**
     * Classify {@code object} as one of the {@link DataType data types}.
     * <p>
     * Both plain Java values and {@link TObject TObjects} are recognized; a
     * {@link TObject} is classified by its {@link Type}. The checks are made in
     * the order link, number, string, boolean and anything that matches none
     * of them is {@link DataType#UNKNOWN}.
     * </p>
     *
     * @param object the object to categorize
     * @return the correct {@link DataType}
     */
    private static DataType getDataType(Object object) {
        Class<?> type = object.getClass();

        // Links
        if(type == Link.class || isTObjectType(object, Type.LINK)) {
            return DataType.LINK;
        }

        // Numbers
        if(isTObjectType(object, Type.DOUBLE, Type.FLOAT, Type.INTEGER,
                Type.LONG) || Number.class.isAssignableFrom(type)
                || OTHER_NUMBER_CLASSES.contains(type)) {
            return DataType.NUMBER;
        }

        // Strings (tags are treated as strings)
        if(isTObjectType(object, Type.STRING, Type.TAG)
                || type == String.class) {
            return DataType.STRING;
        }

        // Booleans
        if(isTObjectType(object, Type.BOOLEAN) || type == Boolean.class
                || type == boolean.class) {
            return DataType.BOOLEAN;
        }

        return DataType.UNKNOWN;
    }

    /**
     * Check whether {@code obj} is a {@link TObject} whose type is one of the
     * given {@code types}.
     *
     * @param obj the object to check
     * @param types the candidate types
     * @return {@code true} if {@code obj} is a {@link TObject} and its type is
     *         identical to any of the {@code types}; {@code false} if it is
     *         not a {@link TObject} or none of the {@code types} match
     */
    private static boolean isTObjectType(Object obj, Type... types) {
        if(!(obj instanceof TObject)) {
            return false;
        }
        TObject tobject = (TObject) obj;
        for (Type candidate : types) {
            if(tobject.getType() == candidate) {
                return true;
            }
        }
        return false;
    }

    /**
     * Copy the {@code elements} into a new set, tolerating {@code null} input.
     *
     * @param elements the elements to include in the returned set; may be
     *            {@code null}
     * @return a new set that contains all of the {@code elements}, or
     *         {@code null} if {@code elements} is {@code null}
     */
    @Nullable
    private static <V> Set<V> newHashSetNullSafe(
            Iterable<? extends V> elements) {
        if(elements == null) {
            return null;
        }
        return Sets.newHashSet(elements);
    }

    /**
     * A collection of classes that don't extend {@link Number} but should
     * still be considered {@link DataType#NUMBER numerical}.
     * <p>
     * The set is populated once by the static initializer below and is
     * consulted by {@link #getDataType(Object)}.
     * </p>
     * <p>
     * NOTE(review): {@link #getDataType(Object)} looks up the result of
     * {@code object.getClass()}; for boxed values that is the wrapper class,
     * so these primitive class tokens may never actually match. Confirm
     * whether they are still needed.
     * </p>
     */
    private static final Set<Class<?>> OTHER_NUMBER_CLASSES = Sets
            .newIdentityHashSet();
    static {
        OTHER_NUMBER_CLASSES.add(int.class);
        OTHER_NUMBER_CLASSES.add(long.class);
        OTHER_NUMBER_CLASSES.add(float.class);
        OTHER_NUMBER_CLASSES.add(double.class);
        OTHER_NUMBER_CLASSES.add(short.class);
        OTHER_NUMBER_CLASSES.add(byte.class);
    }

    /**
     * An internal map where the data is actually stored. This is the (initially
     * empty) delegate that is handed to the constructor.
     */
    private Map<K, Set<V>> data;

    /**
     * A mapping from each of the {@link DataType data types} to the number of
     * stored keys that are characterized as such. The constructor seeds an
     * entry with a zero counter for every {@link DataType}, so a lookup for
     * any non-null type does not return {@code null}.
     */
    private final Map<DataType, AtomicInteger> keyTypes;

    /**
     * The total number of values (including duplicates) added across all the
     * keys. This is the denominator used by {@link #distinctiveness()},
     * {@link #percentKeyDataType(DataType)} and {@link #proportion(Object)}.
     */
    private final AtomicLong totalValueCount;

    /**
     * The total number of unique values (e.g. excluding duplicates) that are
     * stored across all the keys.
     */
    private final AtomicLong uniqueValueCount;

    /**
     * An approximate cache of values stored across all the keys.
     * <p>
     * Whenever a value is added to the map, the bit for its
     * {@link Object#hashCode() hash code} is flipped to indicate that the value
     * is stored. However, hash codes are not guaranteed to be unique among
     * objects, so it's necessary to look through all the values and test the
     * equality for a potential match to determine if an object is actually
     * contained or not.
     * </p>
     * <p>
     * {@link #hasValue(Object)} reads this cache using the absolute value of
     * the hash code as the bit index.
     * </p>
     */
    private final SparseBitSet valueCache;

    /**
     * Construct a new instance that stores its data in {@code delegate}.
     * <p>
     * All of the tracking state starts out empty: every {@link DataType} gets
     * a counter set to zero, both value counters are zero and the value cache
     * has no bits set.
     * </p>
     *
     * @param delegate an {@link Map#isEmpty() empty} map
     * @throws IllegalStateException if the {@code delegate} is not empty
     */
    protected TrackingMultimap(Map<K, Set<V>> delegate) {
        Preconditions.checkState(delegate.isEmpty());
        this.valueCache = new SparseBitSet();
        this.uniqueValueCount = new AtomicLong();
        this.totalValueCount = new AtomicLong();
        this.keyTypes = Maps.newIdentityHashMap();
        for (DataType dataType : DataType.values()) {
            // Seed every type up front so lookups never have to create a
            // counter lazily
            keyTypes.put(dataType, new AtomicInteger());
        }
        this.data = delegate;
    }

    /**
     * Return {@code true} if any portion of the tracked keys is characterized
     * as the specified {@link DataType}.
     * <p>
     * This is determined by checking whether
     * {@link #percentKeyDataType(DataType)} is greater than zero.
     * </p>
     *
     * @param type the {@link DataType} being queried
     * @return {@code true} if the percentage for {@code type} is positive,
     *         {@code false} otherwise
     */
    public boolean containsDataType(DataType type) {
        double percent = percentKeyDataType(type);
        return percent > 0;
    }

    /**
     * Remove the association between {@code key} and {@code value} from the
     * map.
     * <p>
     * If removing {@code value} leaves {@code key} without any values, the
     * {@code key} itself is removed from the map so that no empty value sets
     * linger.
     * </p>
     *
     * @param key the key
     * @param value the value
     * @return {@code true} if the association previously existed and is
     *         removed, {@code false} if {@code key} is not mapped or is not
     *         associated with {@code value}
     */
    public boolean delete(K key, V value) {
        Set<V> values = data.get(key);
        if(values == null || !values.remove(value)) {
            return false;
        }
        if(values.isEmpty()) {
            // The mapping must be dropped by its key; passing the (now empty)
            // value set to Map#remove would look it up as a key and leave the
            // empty entry behind.
            data.remove(key);
        }
        return true;
    }

    /**
     * The {@code distinctiveness} is a measure of the number of unique keys in
     * the map relative to the total number of values, expressed as a number
     * between 0 and 1.
     * <p>
     * The size of the internal map gives the number of unique keys; this
     * method divides that by the total number of values across all of the
     * keys to get a mathematical measure of how much duplication exists among
     * the data in the map.
     * </p>
     * <p>
     * A distinctiveness of 1 means that the keys are completely distinct (e.g.
     * no key maps to more than 1 value). Lower measures of distinctiveness mean
     * that they are less distinct (e.g. on average, each key maps to more
     * values as the distinctiveness gets closer to 0).
     * </p>
     *
     * @return the distinctiveness of the data, on a scale from 0 to 1; 0 if no
     *         values have been counted
     */
    public double distinctiveness() {
        long total = totalValueCount.get();
        if(total == 0) {
            // Nothing has been counted; avoid dividing by zero
            return 0;
        }
        return data.size() / (double) total;
    }

    /**
     * Return the entry set of the internal map. The set is handed back as-is
     * (it is not copied or wrapped).
     */
    @Override
    public Set<Entry<K, Set<V>>> entrySet() {
        Set<Entry<K, Set<V>>> entries = data.entrySet();
        return entries;
    }

    /**
     * Two {@link TrackingMultimap TrackingMultimaps} are equal if their
     * internal maps are equal. Any object that is not a
     * {@link TrackingMultimap} is never considered equal.
     */
    @Override
    public boolean equals(Object obj) {
        if(!(obj instanceof TrackingMultimap)) {
            return false;
        }
        @SuppressWarnings("unchecked")
        TrackingMultimap<K, V> other = (TrackingMultimap<K, V>) obj;
        return data.equals(other.data);
    }

    /**
     * Return the set of values that the internal map holds for {@code key}.
     * The lookup is delegated directly, so the result is whatever the
     * internal map returns for that key.
     */
    @Override
    public Set<V> get(Object key) {
        Set<V> values = data.get(key);
        return values;
    }

    /**
     * Return the hash code of the internal map, which keeps this method
     * consistent with {@link #equals(Object)}.
     */
    @Override
    public int hashCode() {
        int hash = data.hashCode();
        return hash;
    }

    /**
     * Return {@code true} if this map associates {@code value} with at least
     * one key.
     * <p>
     * This method is different from {@link #containsValue(Object)} because it
     * checks for values <strong>within</strong> the Sets that are mapped from
     * keys. Use the aforementioned if you need to check for the existence of an
     * entire Set as opposed to an individual value.
     * </p>
     * <p>
     * The value cache is consulted first: if the bit for the value's hash code
     * is not set, the answer is {@code false} without scanning. Otherwise
     * every value set is searched, because a set bit only indicates a
     * possible match.
     * </p>
     *
     * @param value the value to check
     * @return {@code true} if the value is contained, {@code false} otherwise
     */
    public boolean hasValue(V value) {
        // NOTE(review): Math.abs returns a negative number for
        // Integer.MIN_VALUE; confirm how the bit set and the code that
        // populates it treat such an index.
        int bit = Math.abs(value.hashCode());
        if(!valueCache.get(bit)) {
            return false;
        }
        for (Set<V> stored : data.values()) {
            if(stored.contains(value)) {
                return true;
            }
        }
        return false;
    }

    /**
     * Add a new association between {@code key} and {@code value} to the map if
     * it doesn't already exist.
     * <p>
     * If {@code key} is not mapped yet, a new {@code ValueSetWrapper} for it is
     * stored in the internal map before the {@code value} is added.
     * </p>
     *
     * @param key the key
     * @param value the value
     * @return {@code true} if the association didn't previously exist and is
     *         now added
     */
    public boolean insert(K key, V value) {
        Set<V> existing = data.get(key);
        if(existing != null) {
            return existing.add(value);
        }
        Set<V> created = new ValueSetWrapper(key);
        data.put(key, created);
        return created.add(value);
    }

    /**
     * Merge all the {@code values} into the set of values that is mapped from
     * {@code key}. Each value is added via {@link #insert(Object, Object)}.
     * 
     * @param key the key
     * @param values the values to merge
     * @return all the values mapped from {@code key} after the merge, as
     *         returned by {@link #get(Object)}
     */
    public Set<V> merge(K key, Set<V> values) {
        Iterator<V> it = values.iterator();
        while (it.hasNext()) {
            insert(key, it.next());
        }
        return get(key);
    }

    /**
     * Return the percent (between 0 and 1) of stored associations whose key is
     * an instance of the specified {@link DataType type}.
     * <p>
     * The per-type counters are adjusted once for every value that is added
     * or removed, so a key contributes once for each value mapped from it.
     * </p>
     * 
     * @param type the {@link DataType} of interest
     * @return the percent of keys of the {@code type}, or {@code 0} if no
     *         values are stored
     */
    public double percentKeyDataType(DataType type) {
        double total = totalValueCount.get();
        if(total == 0) {
            // Nothing is stored; avoid producing NaN from a 0/0 division.
            return 0;
        }
        return keyTypes.get(type).get() / total;
    }

    /**
     * Determines the proportion of occurrence of a particular key. This is
     * merely the frequency of that key (the number of values mapped from it)
     * divided by the total number of values stored across all keys.
     * 
     * @param element the key for which the proportion is being sought
     * @return the proportion of the key, or {@code 0} if the key is not mapped
     *         or no values are stored
     */
    public double proportion(K element) {
        Set<V> values = data.get(element);
        double total = totalValueCount.get();
        if(values == null || total == 0) {
            // An unmapped key has no share, and an empty map has nothing to
            // take a share of.
            return 0;
        }
        return values.size() / total;
    }

    /**
     * <p>
     * <strong>NOTE:</strong> This implementation will replace all the existing
     * values mapped from {@code key} with those specified in the {@code value}.
     * If you want "merge-like" functionality call the
     * {@link #merge(Object, Set)} method.
     * </p>
     * <p>
     * The returned set is a copy of the values that were mapped before the
     * call, or {@code null} if the key was not mapped.
     * </p>
     * {@inheritDoc}
     */
    @Override
    public Set<V> put(K key, Set<V> value) {
        Set<V> current = data.get(key);
        if(current != null && current == value) {
            // The caller is re-putting the very set that is already mapped
            // from the key. Deleting the old values first would also empty
            // the set we are about to read from, so there is nothing to do
            // besides reporting the current values.
            return newHashSetNullSafe(current);
        }
        // Work on a copy so the previous values can be returned and so the
        // loop below does not iterate a set while it is being modified.
        Set<V> stored = newHashSetNullSafe(current);
        if(stored == null) {
            data.put(key, new ValueSetWrapper(key));
        }
        else {
            for (V element : stored) {
                delete(key, element);
            }
        }
        for (V element : value) {
            insert(key, element);
        }
        return stored;
    }

    /**
     * Remove every value that is mapped from {@code key}, and drop the key
     * itself if it is left with an empty value set.
     * 
     * @param key the key to remove
     * @return a copy of the values that were mapped from {@code key} before
     *         the call, as produced by the null-safe copy helper
     */
    @SuppressWarnings("unchecked")
    @Override
    public Set<V> remove(Object key) {
        Set<V> previous = newHashSetNullSafe(data.get(key));
        if(previous != null) {
            // The type cast is valid because the presence of elements over
            // which to iterate ensures that the key was stored through a
            // type checked method.
            K typed = (K) key;
            for (V element : previous) {
                delete(typed, element);
            }
        }
        // Look the key up again, now that its values have been deleted.
        Set<V> remaining = data.get(key);
        boolean drained = remaining != null && remaining.isEmpty();
        if(drained) {
            data.remove(key);
        }
        return previous;
    }

    /**
     * Return a relative measure of the statistical dispersion in this data.
     * <p>
     * There are several ways to measure statistical dispersion, so callers
     * should not rely on a specific underlying implementation because it may
     * change over time. This method simply offers a value that allows for
     * comparison of dispersion across data sets.
     * </p>
     * <p>
     * A larger dispersion value means that the data is more spread out whereas
     * a smaller dispersion value indicates the opposite.
     * </p>
     * <p>
     * The measure is computed over the number of values mapped from each key.
     * If there are no keys, or a component would require dividing by zero,
     * that component contributes {@code 0} instead of propagating NaN.
     * </p>
     * 
     * @return the dispersion value for this data
     */
    public double spread() {
        // Collect the number of values mapped from each key
        double[] frequencies = new double[data.values().size()];
        int index = 0;
        for (Set<V> records : data.values()) {
            frequencies[index++] = records.size();
        }
        if(frequencies.length == 0) {
            // No data means there is nothing to be dispersed
            return 0;
        }
        DescriptiveStatistics stats = new DescriptiveStatistics(frequencies);

        // The mean is needed several times, so compute it once instead of
        // asking for it again on every loop iteration below.
        double mean = stats.getMean();

        // Get the quartile coefficient of dispersion, which is a cross
        // dataset mechanism for comparing the relative dispersion of data.
        double p1 = stats.getPercentile(25);
        double p3 = stats.getPercentile(75);
        double quartileSum = p3 + p1;
        double coefficientOfDispersion = quartileSum == 0 ? 0
                : (p3 - p1) / quartileSum;

        // Grab the coefficient of variance
        double coefficientOfVariance = mean == 0 ? 0
                : stats.getStandardDeviation() / mean;

        // Calculate the average absolute deviation from the mean
        double averageAbsoluteDeviation = 0;
        if(mean != 0) {
            double[] deviations = new double[frequencies.length];
            for (int i = 0; i < deviations.length; ++i) {
                deviations[i] = Math.abs(frequencies[i] - mean);
            }
            averageAbsoluteDeviation = StatUtils.mean(deviations) / mean;
        }

        // Apply a weighting to the various components
        return (0.50 * coefficientOfDispersion) + (0.40 * coefficientOfVariance)
                + (0.10 * averageAbsoluteDeviation);
    }

    /**
     * Return the string representation of the backing map.
     */
    @Override
    public String toString() {
        return this.data.toString();
    }

    /**
     * Calculates the uniqueness of the data: the {@link #proportion(Object)
     * proportion} of every key in the {@link #keySet() key set} is squared,
     * the squares are summed, and the square root of that sum is subtracted
     * from 1.
     * <p>
     * When many distinct keys appear with similar frequency, each one
     * contributes only a small squared proportion. The square root term
     * therefore stays small and the result is relatively high.
     * </p>
     * <p>
     * When a few keys dominate, their large proportions weigh heavily in the
     * sum of squares. The square root term is then larger and the result is
     * correspondingly lower.
     * </p>
     * 
     * @return the uniqueness of the data, on a scale from 0 to 1
     */
    public double uniqueness() {
        double total = 0;
        for (K key : this.keySet()) {
            double share = proportion(key);
            total += Math.pow(share, 2);
        }
        double magnitude = Math.sqrt(total);
        return 1 - magnitude;
    }

    /**
     * Determines how many distinct keys exist within the {@link Map} and
     * returns the appropriate {@link VariableType}.
     * 
     * The three possible return types are:
     * <ol>
     * <li><strong>DICHOTOMOUS</strong>: if there are at most 2 distinct
     * keys</li>
     * <li><strong>NOMINAL</strong>: if the number of distinct keys is greater
     * than 2 and less than or equal to 12</li>
     * <li><strong>INTERVAL</strong>: if there are more than 12 distinct
     * keys</li>
     * </ol>
     * 
     * @return the {@link VariableType} that matches the number of keys
     */
    public VariableType variableType() {
        // NOTE: The boundary between nominal and interval is arbitrary, and may
        // require tweaking since it is a heuristic model.
        int distinct = data.keySet().size();
        if(distinct > 12) {
            return VariableType.INTERVAL;
        }
        if(distinct > 2) {
            return VariableType.NOMINAL;
        }
        return VariableType.DICHOTOMOUS;
    }

    /**
     * Return a new {@link Set} (of the appropriate type) to use for storing the
     * values that are mapped from a key.
     * <p>
     * The returned set is not stored in the map directly; it becomes the
     * storage behind an internal wrapper that keeps the tracked statistics up
     * to date. It is called once for every wrapper that is created.
     * </p>
     * 
     * @return a new {@link Set}
     */
    protected abstract Set<V> createValueSet();

    /**
     * A broad classification of objects that describes the nature of the data.
     * <p>
     * The declaration order of the constants is part of the type (ordinals),
     * so new constants should be appended with care.
     * </p>
     * 
     * @author Jeff Nelson
     */
    public enum DataType {
        BOOLEAN,
        LINK,
        NUMBER,
        STRING,
        UNKNOWN
    }

    /**
     * A classification of objects that describes how data is categorized.
     */
    public enum VariableType {
        DICHOTOMOUS,
        INTERVAL,
        NOMINAL
    }

    /**
     * An internal wrapper around a Set returned from the
     * {@link #createValueSet()} method.
     * <p>
     * The wrapper is responsible for tracking stats for the individual set and
     * updating the appropriate variables of the outer class. This ensures that
     * the caller can interact with individual value sets without breaking
     * tracking semantics.
     * </p>
     * <p>
     * Removal through the {@link #iterator() iterator} is carried out by the
     * underlying set's own iterator, so the bulk operations inherited from
     * {@link AbstractSet} (which are built on the iterator) can remove several
     * elements in one pass while still updating the tracked stats.
     * </p>
     * 
     * @author Jeff Nelson
     */
    private class ValueSetWrapper extends AbstractSet<V> {

        /**
         * The key from which this {@link Set} is mapped in the outer
         * TrackingMultimap.
         */
        private K key;

        /**
         * The wrapped set that actually stores the data.
         */
        private final Set<V> values = createValueSet();

        /**
         * Construct a new instance.
         * 
         * @param key the key from which this set is mapped
         */
        ValueSetWrapper(K key) {
            this.key = key;
        }

        /**
         * Add {@code element} to the wrapped set and, if it was not already
         * present there, update the counters of the outer class.
         * 
         * @param element the value to add
         * @return {@code true} if the wrapped set changed
         */
        @Override
        public boolean add(V element) {
            // This must be determined before the element is stored, because
            // afterwards the answer would always be "contained".
            boolean contained = hasValue(element);
            if(values.add(element)) {
                totalValueCount.incrementAndGet();
                DataType keyType = getDataType(key);
                keyTypes.get(keyType).incrementAndGet();
                if(!contained) {
                    // The value was not previously contained, so we must update
                    // the number of unique values stored across all the keys.
                    uniqueValueCount.incrementAndGet();
                    // Keep this index derivation identical to the one used
                    // when the cache is read.
                    valueCache.set(Math.abs(element.hashCode()));
                }
                return true;
            }
            else {
                return false;
            }
        }

        /**
         * Compare the wrapped values to {@code obj}, which may be another
         * wrapper or any other {@link Set}.
         */
        @SuppressWarnings("unchecked")
        @Override
        public boolean equals(Object obj) {
            if(obj instanceof TrackingMultimap.ValueSetWrapper) {
                return values.equals(((ValueSetWrapper) obj).values);
            }
            else if(obj instanceof Set) {
                return Objects.equals(values, obj);
            }
            else {
                return false;
            }
        }

        @Override
        public int hashCode() {
            return values.hashCode();
        }

        @Override
        public Iterator<V> iterator() {

            return new Iterator<V>() {

                /**
                 * The delegate iterator that controls state.
                 */
                private final Iterator<V> delegate = values.iterator();

                /**
                 * The last value returned from the {@link #next()} method.
                 */
                private V next = null;

                @Override
                public boolean hasNext() {
                    return delegate.hasNext();
                }

                @Override
                public V next() {
                    next = delegate.next();
                    return next;
                }

                @Override
                public void remove() {
                    // Remove through the delegate (instead of through the
                    // wrapped set) so that the delegate stays valid and the
                    // iteration can continue after the removal. The delegate
                    // also enforces the usual preconditions for calling
                    // this method.
                    delegate.remove();
                    untrack(next);
                    next = null;
                }

            };
        }

        /**
         * Remove {@code element} from the wrapped set and, if it was present,
         * update the counters of the outer class.
         * 
         * @param element the value to remove
         * @return {@code true} if the wrapped set changed
         */
        @Override
        public boolean remove(Object element) {
            if(values.remove(element)) {
                untrack(element);
                return true;
            }
            else {
                return false;
            }
        }

        @Override
        public int size() {
            return values.size();
        }

        @Override
        public String toString() {
            return values.toString();
        }

        /**
         * Update the counters of the outer class after {@code element} has
         * been removed from the wrapped set.
         * 
         * @param element the value that was just removed
         */
        @SuppressWarnings("unchecked")
        private void untrack(Object element) {
            totalValueCount.decrementAndGet();
            DataType keyType = getDataType(key);
            keyTypes.get(keyType).decrementAndGet();
            boolean contained = hasValue((V) element);
            if(!contained) {
                // Since the value is no longer "contained" we are free to
                // decrement the number of unique values stored across all
                // the keys
                uniqueValueCount.decrementAndGet();
            }
        }
    }
}